olm-chat-7b / open_lm /run_bench.sh
henhenhahi111112's picture
Upload folder using huggingface_hub
af6e330 verified
raw
history blame
494 Bytes
#!/bin/bash
#
# Launches the `benchmark.main` module through torchrun with a single process
# per node, using the fixed settings below.
#
# Usage: ./run_bench.sh
#
# Exit status is that of the torchrun command (it is the last command run).

# Abort on command failure, on use of an unset variable, and on a failing
# pipeline stage.
set -euo pipefail

BATCHSIZE=1
MODEL="large2048"
# Experiment name is derived from the model name, e.g. "benchmark-large2048".
EXP_NAME="benchmark-$MODEL"

# The --train-data value is double-quoted, so the shell does NOT brace-expand
# {0..7} / {0000000..0000300}; the pattern is handed to the program verbatim.
# NOTE(review): presumably the data loader expands the pattern itself — confirm.
#
# Variable expansions are quoted so each is always passed as exactly one
# argument, and the final argument carries no trailing line continuation so
# text appended after the command cannot be absorbed into it.
torchrun --nproc-per-node 1 -m benchmark.main \
  --train-data "pipe:aws s3 cp s3://s-laion/redpajama-tars/8192-v1/{0..7}/shard-{0000000..0000300}.tar -" \
  --train-num-samples 30720 \
  --workers 6 \
  --precision amp_bfloat16 \
  --grad-checkpointing \
  --grad-clip-norm 1 \
  --log-every-n-steps 1 \
  --fsdp \
  --profile \
  --batch-size "$BATCHSIZE" \
  --model "$MODEL" \
  --name "$EXP_NAME"