diff --git a/train_ppo.sh b/train_ppo.sh new file mode 100644 index 000000000..6b83bb080 --- /dev/null +++ b/train_ppo.sh @@ -0,0 +1,24 @@ +#!/bin/bash + +if [ -z "$1" ]; then + echo "Usage: $0 " + exit 1 +fi + +PROJECT=sigmaban-standup +ENV=sigmaban-standup-v0 +ALGO=ppo +TAGS=standup +EXP_ID=`python next_run_id.py $ALGO $ENV` +RUN_NAME="${HOSTNAME}_${EXP_ID}_$1" + +# killall -9 python + +nohup python train.py --run-name="$RUN_NAME" \ + --env=$ENV --algo=$ALGO --track --wandb-project-name $PROJECT \ + --eval-freq=150000 \ + --eval-episodes=100 --n-eval-envs=4 --vec-env=subproc \ + -tags exp-$EXP_ID $TAGS h-$HOSTNAME > $HOSTNAME.out & + +tail -f $HOSTNAME.out +