Files
CSE5100H3/hw3/bash/2-4-experiments.sh
Zheyuan Wu 8917fb124f updates
2025-11-02 20:11:37 -06:00

18 lines
1.8 KiB
Bash

# HalfCheetah-v4 baseline experiment sweep.
#
# Every run invokes `python run.py` with a path relative to the current
# directory, so start this script from the directory that contains run.py.
# Runs execute one after another. A failing run does not stop the sweep:
# its name is recorded, the remaining runs still execute, and the sweep
# finishes with a non-zero status plus a summary on stderr.
#
# Experiment names mirror the flags that are actually passed:
#   na   -> -na
#   rtg  -> -rtg
#   bgsN -> --baseline_gradient_steps N
#   blrX -> --baseline_learning_rate X
#   n300 -> -n 300
# NOTE(review): `lb` presumably marks the -b 10000 run; confirm.

# Names of the runs whose python process exited non-zero.
halfcheetah_failed=()

#######################################
# Launch one HalfCheetah-v4 training run.
# Globals:   halfcheetah_failed (appended to when the run fails)
# Arguments: $1 - experiment name (passed as --exp_name, always last)
#            $2 - value for -n
#            $3 - value for -b
#            $4.. - extra flags, forwarded verbatim before --exp_name
# Outputs:   one line on stderr when the run fails
# Returns:   the exit status of the python process
#######################################
run_halfcheetah() {
  local exp_name=$1 iters=$2 batch=$3
  local status=0
  shift 3
  python run.py --env_name HalfCheetah-v4 -n "$iters" -b "$batch" "$@" \
    --exp_name "$exp_name" || status=$?
  if (( status != 0 )); then
    printf 'run failed (exit %d): %s\n' "$status" "$exp_name" >&2
    halfcheetah_failed+=("$exp_name")
  fi
  return "$status"
}

#######################################
# Run the whole sweep in a fixed order.
# Globals:   halfcheetah_failed (reset, then filled by run_halfcheetah)
# Arguments: none
# Outputs:   list of failed experiment names on stderr, if any
# Returns:   0 when every run succeeded, 1 otherwise
#######################################
run_halfcheetah_sweep() {
  halfcheetah_failed=()

  # -na with baseline
  run_halfcheetah halfcheetah_na_baseline 100 5000 \
    -na --use_baseline
  run_halfcheetah halfcheetah_na_baseline_bgs3 100 5000 \
    -na --use_baseline --baseline_gradient_steps 3
  run_halfcheetah halfcheetah_na_baseline_blr1e-3 100 5000 \
    -na --use_baseline --baseline_learning_rate 0.001

  # with reward to go
  run_halfcheetah halfcheetah_na_rtg_baseline 100 5000 \
    -rtg -na --use_baseline
  run_halfcheetah halfcheetah_na_rtg_baseline_bgs3 100 5000 \
    -rtg -na --use_baseline --baseline_gradient_steps 3
  run_halfcheetah halfcheetah_na_rtg_baseline_blr1e-3 100 5000 \
    -rtg -na --use_baseline --baseline_learning_rate 0.001

  # The next four runs do not pass -na, so their names carry no `na` tag.
  # They were previously named halfcheetah_na_rtg_baseline_bgs5_blr1e-2,
  # ..._bgs10, ..._bgs10_blr1e-4 and ..._bgs10_blr1e-3; the last of those
  # runs 8 baseline gradient steps and is therefore named bgs8. Update any
  # plotting code that refers to the old names.

  # Berkeley parameters
  run_halfcheetah halfcheetah_rtg_baseline_bgs5_blr1e-2 100 5000 \
    -rtg --use_baseline --baseline_gradient_steps 5 \
    --baseline_learning_rate 0.01

  # Exploratory baseline settings
  run_halfcheetah halfcheetah_rtg_baseline_bgs10 100 5000 \
    -rtg --use_baseline --baseline_gradient_steps 10
  run_halfcheetah halfcheetah_rtg_baseline_bgs10_blr1e-4 100 5000 \
    -rtg --use_baseline --baseline_gradient_steps 10 \
    --baseline_learning_rate 0.0001
  run_halfcheetah halfcheetah_rtg_baseline_bgs8_blr1e-3 100 5000 \
    -rtg --use_baseline --baseline_gradient_steps 8 \
    --baseline_learning_rate 0.001

  # Extended -na runs (-n 300, and -b 10000 for the second one)
  run_halfcheetah halfcheetah_na_baseline_n300 300 5000 \
    -na --use_baseline
  run_halfcheetah halfcheetah_na_lb_baseline 300 10000 \
    -na --use_baseline

  if (( ${#halfcheetah_failed[@]} > 0 )); then
    printf 'failed experiments:\n' >&2
    printf '  %s\n' "${halfcheetah_failed[@]}" >&2
    return 1
  fi
  return 0
}

# No `exit` here: the sweep's return value is left as the status of the last
# command so that anything following this block still runs.
run_halfcheetah_sweep