source benchmarks/train_loop.sh # export WANDB_PROJECT_NAME="rl-algo-impls" BENCHMARK_MAX_PROCS="${BENCHMARK_MAX_PROCS:-6}" ALGOS=( # "vpg" # "dqn" # "ppo" "a2c" ) ENVS=( # Basic "CartPole-v1" "MountainCar-v0" "MountainCarContinuous-v0" "Acrobot-v1" "LunarLander-v2" "BipedalWalker-v3" # PyBullet "HalfCheetahBulletEnv-v0" "AntBulletEnv-v0" "HopperBulletEnv-v0" "Walker2DBulletEnv-v0" # CarRacing "CarRacing-v0" # Atari "PongNoFrameskip-v4" "BreakoutNoFrameskip-v4" "SpaceInvadersNoFrameskip-v4" "QbertNoFrameskip-v4" ) train_loop "${ALGOS[*]}" "${ENVS[*]}" | xargs -I CMD -P $BENCHMARK_MAX_PROCS bash -c CMD