This commit is contained in:
Zheyuan Wu
2025-11-02 20:11:37 -06:00
parent 248051db0d
commit 8917fb124f
15 changed files with 43 additions and 21 deletions

View File

@@ -7,4 +7,11 @@ python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg -na --use_baseline -
# Baseline variations with -rtg and -na: one run overrides
# --baseline_gradient_steps, the other overrides --baseline_learning_rate.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg -na --use_baseline --baseline_gradient_steps 3 --exp_name halfcheetah_na_rtg_baseline_bgs3
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg -na --use_baseline --baseline_learning_rate 0.001 --exp_name halfcheetah_na_rtg_baseline_blr1e-3
# Berkeley parameters
# NOTE(review): from here through the "try" group the commands omit -na, yet
# their --exp_name values still contain "na" -- confirm which is intended.
# This run is listed once: repeating it with the same --exp_name would only
# redo the identical experiment under the identical name.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg --use_baseline --baseline_gradient_steps 5 --baseline_learning_rate 0.01 --exp_name halfcheetah_na_rtg_baseline_bgs5_blr1e-2
# try: larger --baseline_gradient_steps, alone and combined with smaller
# --baseline_learning_rate values.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg --use_baseline --baseline_gradient_steps 10 --exp_name halfcheetah_na_rtg_baseline_bgs10
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg --use_baseline --baseline_gradient_steps 10 --baseline_learning_rate 0.0001 --exp_name halfcheetah_na_rtg_baseline_bgs10_blr1e-4
# NOTE(review): --baseline_gradient_steps is 8 here but the experiment name
# says "bgs10" -- confirm which value is intended before trusting the label.
python run.py --env_name HalfCheetah-v4 -n 100 -b 5000 -rtg --use_baseline --baseline_gradient_steps 8 --baseline_learning_rate 0.001 --exp_name halfcheetah_na_rtg_baseline_bgs10_blr1e-3
# Extended na: -n raised from 100 to 300, with -na and without -rtg; the second
# run also raises -b from 5000 to 10000 (the "lb" in its name).
python run.py --env_name HalfCheetah-v4 -n 300 -b 5000 -na --use_baseline --exp_name halfcheetah_na_baseline_n300
python run.py --env_name HalfCheetah-v4 -n 300 -b 10000 -na --use_baseline --exp_name halfcheetah_na_lb_baseline