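#!/usr/bin/env bash
# HalfCheetah-v4 experiment commands: every invocation of run.py below passes
# --use_baseline and writes under its own distinct --exp_name.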
# Baseline runs with -na (no -rtg): first with no --baseline_* overrides, then
# with --baseline_gradient_steps 3, then with --baseline_learning_rate 0.001.
# Each command is a standalone statement; the stray "|" lines that used to sit
# between them were syntax errors and have been removed.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -na --use_baseline \
  --exp_name halfcheetah_na_baseline

python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -na --use_baseline \
  --baseline_gradient_steps 3 \
  --exp_name halfcheetah_na_baseline_bgs3

python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -na --use_baseline \
  --baseline_learning_rate 0.001 \
  --exp_name halfcheetah_na_baseline_blr1e-3
# with reward to go
# Same three baseline settings as the plain -na runs, with -rtg added:
# no --baseline_* overrides, --baseline_gradient_steps 3, and
# --baseline_learning_rate 0.001. Stray "|" separator lines removed so each
# command parses as its own statement.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg -na --use_baseline \
  --exp_name halfcheetah_na_rtg_baseline

python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg -na --use_baseline \
  --baseline_gradient_steps 3 \
  --exp_name halfcheetah_na_rtg_baseline_bgs3

python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg -na --use_baseline \
  --baseline_learning_rate 0.001 \
  --exp_name halfcheetah_na_rtg_baseline_blr1e-3
# Berkeley parameters
# Single -rtg run with --baseline_gradient_steps 5 and
# --baseline_learning_rate 0.01. Stray "|" separator lines removed.
# NOTE(review): -na is not passed here although the --exp_name contains "_na_";
# confirm whether the flag or the name is the intended one.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg --use_baseline \
  --baseline_gradient_steps 5 --baseline_learning_rate 0.01 \
  --exp_name halfcheetah_na_rtg_baseline_bgs5_blr1e-2
# try
# Exploratory -rtg runs varying --baseline_gradient_steps and
# --baseline_learning_rate. Stray "|" separator lines removed.
# NOTE(review): none of these runs pass -na although every --exp_name contains
# "_na_"; confirm whether the flag or the names are the intended ones.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg --use_baseline \
  --baseline_gradient_steps 10 \
  --exp_name halfcheetah_na_rtg_baseline_bgs10

python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg --use_baseline \
  --baseline_gradient_steps 10 --baseline_learning_rate 0.0001 \
  --exp_name halfcheetah_na_rtg_baseline_bgs10_blr1e-4

# NOTE(review): this run passes --baseline_gradient_steps 8 but its name says
# "bgs10"; confirm which is intended before comparing results by name.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg --use_baseline \
  --baseline_gradient_steps 8 --baseline_learning_rate 0.001 \
  --exp_name halfcheetah_na_rtg_baseline_bgs10_blr1e-3
# Extended na
# -na baseline runs with -n 300 (the other runs in this file use -n 100); the
# second run also uses -b 10000 instead of -b 5000. Stray "|" separator lines
# removed so each command parses as its own statement.
python run.py --env_name HalfCheetah-v4 -n 300 -b 5000 -na --use_baseline \
  --exp_name halfcheetah_na_baseline_n300

python run.py --env_name HalfCheetah-v4 -n 300 -b 10000 -na --use_baseline \
  --exp_name halfcheetah_na_lb_baseline