This commit is contained in:
Zheyuan Wu
2025-10-14 20:34:47 -05:00
parent 250f763f1f
commit e74aac95e3
517 changed files with 1418 additions and 16701 deletions

View File

@@ -0,0 +1,33 @@
# DQN run configuration (Hydra/OmegaConf).
# Values written as `${a.b}` are interpolations resolved against this same
# file when the config is loaded, so the nesting below is significant.
seed: 42
env_name: CartPole-v1
train:
  # Mirrors the replay buffer's n-step setting via interpolation.
  nstep: ${buffer.nstep}
  timesteps: 50000
  batch_size: 128
  test_every: 2500
  # NOTE(review): presumably an epsilon-greedy schedule going from eps_max to
  # eps_min over eps_steps -- confirm against the training loop.
  eps_max: 1
  eps_min: 0.05
  eps_steps: 12500
  start_steps: 0
  plot_interval: 2000
  eval_interval: 2000
  eval_episodes: 10
agent:
  gamma: 0.99
  lr: 0.002
  tau: 0.1
  # Mirrors the replay buffer's n-step setting via interpolation.
  nstep: ${buffer.nstep}
  target_update_interval: 3
  hidden_size: 64
  activation:
    # `_target_` is Hydra's instantiate key: the dotted path of the class to
    # construct. It is the only key that belongs to `activation`.
    _target_: torch.nn.ELU
  use_dueling: false
  use_double: false
buffer:
  capacity: 50000
  use_per: false
  nstep: 1
  # Mirrors the agent's discount factor via interpolation.
  gamma: ${agent.gamma}
  # NOTE(review): the per_* values presumably only take effect when use_per
  # is true -- verify in the buffer implementation.
  per_alpha: 0.7
  per_beta: 0.4
  per_eps: 0.01

154
runs/DQN/.hydra/hydra.yaml Normal file
View File

@@ -0,0 +1,154 @@
# Hydra's own runtime configuration for this run, as written to the run's
# `.hydra` output sub-directory. `???` is OmegaConf's marker for a mandatory
# value that has not been set.
#
# The blank lines inside the single-quoted help templates are significant:
# in a quoted YAML scalar a single line break folds to a space, while each
# blank line contributes a newline to the resulting string.
hydra:
  run:
    dir: ./runs/${now:%Y-%m-%d}/${now:%H-%M-%S}_${hydra.job.override_dirname}
  sweep:
    dir: ./sweeps/${now:%Y-%m-%d}/${now:%H-%M-%S}_${hydra.job.override_dirname}
    subdir: ${hydra.job.num}
  launcher:
    _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
  sweeper:
    _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
    max_batch_size: null
    params: null
  help:
    app_name: ${hydra.job.name}
    header: '${hydra.help.app_name} is powered by Hydra.

      '
    footer: 'Powered by Hydra (https://hydra.cc)

      Use --hydra-help to view Hydra specific help

      '
    template: '${hydra.help.header}

      == Configuration groups ==

      Compose your configuration from those groups (group=option)


      $APP_CONFIG_GROUPS


      == Config ==

      Override anything in the config (foo.bar=value)


      $CONFIG


      ${hydra.help.footer}

      '
  hydra_help:
    template: 'Hydra (${hydra.runtime.version})

      See https://hydra.cc for more info.


      == Flags ==

      $FLAGS_HELP


      == Configuration groups ==

      Compose your configuration from those groups (For example, append hydra/job_logging=disabled
      to command line)


      $HYDRA_CONFIG_GROUPS


      Use ''--cfg hydra'' to Show the Hydra config.

      '
    hydra_help: ???
  # Logging setup for Hydra's own messages (console only).
  hydra_logging:
    version: 1
    formatters:
      simple:
        format: '[%(asctime)s][HYDRA] %(message)s'
    handlers:
      console:
        class: logging.StreamHandler
        formatter: simple
        stream: ext://sys.stdout
    root:
      level: INFO
      handlers:
      - console
    loggers:
      logging_example:
        level: DEBUG
    disable_existing_loggers: false
  # Logging setup for the job itself: console plus a per-job log file in the
  # run's output directory.
  job_logging:
    version: 1
    formatters:
      simple:
        format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
    handlers:
      console:
        class: logging.StreamHandler
        formatter: simple
        stream: ext://sys.stdout
      file:
        class: logging.FileHandler
        formatter: simple
        filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
    root:
      level: INFO
      handlers:
      - console
      - file
    disable_existing_loggers: false
  env: {}
  mode: RUN
  searchpath: []
  callbacks: {}
  output_subdir: .hydra
  overrides:
    hydra:
    - hydra.mode=RUN
    task: []
  job:
    name: main
    chdir: true
    override_dirname: ''
    id: ???
    num: ???
    config_name: config
    env_set: {}
    env_copy: []
    config:
      override_dirname:
        kv_sep: '='
        item_sep: ','
        exclude_keys: []
  runtime:
    version: 1.3.2
    version_base: '1.3'
    cwd: D:\Documents\Nextcloud\Documents\Project WUSTL\Academic\2025_Fall\CSE5100\Homeworks\hw2
    config_sources:
    - path: hydra.conf
      schema: pkg
      provider: hydra
    - path: D:\Documents\Nextcloud\Documents\Project WUSTL\Academic\2025_Fall\CSE5100\Homeworks\hw2\hw2\cfgs
      schema: file
      provider: main
    - path: ''
      schema: structured
      provider: schema
    output_dir: D:\Documents\Nextcloud\Documents\Project WUSTL\Academic\2025_Fall\CSE5100\Homeworks\hw2\runs\2025-10-13\22-40-28_
    choices:
      hydra/env: default
      hydra/callbacks: null
      hydra/job_logging: default
      hydra/hydra_logging: default
      hydra/hydra_help: default
      hydra/help: default
      hydra/sweeper: basic
      hydra/launcher: basic
      hydra/output: default
  verbose: false

View File

@@ -0,0 +1 @@
# Empty list: no overrides are recorded in this file.
# NOTE(review): presumably the run's command-line task overrides -- confirm
# which file this hunk belongs to, since its path is not shown here.
[]

BIN
runs/DQN/best_videos.mp4 Normal file

Binary file not shown.

BIN
runs/DQN/final_videos.mp4 Normal file

Binary file not shown.

28
runs/DQN/main.log Normal file
View File

@@ -0,0 +1,28 @@
[2025-10-13 22:40:31,116][__main__][INFO] - Training for 50000 timesteps with NormalQNetwork and NormalReplayBuffer
[2025-10-13 22:40:42,581][core][INFO] - Step: 2000, Eval mean: 262.8, Eval std: 52.92409659125038
[2025-10-13 22:40:54,700][core][INFO] - Step: 4000, Eval mean: 243.4, Eval std: 65.53655468515262
[2025-10-13 22:41:06,329][core][INFO] - Step: 6000, Eval mean: 181.4, Eval std: 57.339689570139804
[2025-10-13 22:41:17,476][core][INFO] - Step: 8000, Eval mean: 98.2, Eval std: 2.638181191654584
[2025-10-13 22:41:28,845][core][INFO] - Step: 10000, Eval mean: 116.9, Eval std: 5.18555686498567
[2025-10-13 22:41:40,462][core][INFO] - Step: 12000, Eval mean: 108.0, Eval std: 3.4641016151377544
[2025-10-13 22:41:52,444][core][INFO] - Step: 14000, Eval mean: 149.4, Eval std: 7.578918128598566
[2025-10-13 22:42:04,993][core][INFO] - Step: 16000, Eval mean: 250.2, Eval std: 12.416118556135006
[2025-10-13 22:42:18,663][core][INFO] - Step: 18000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:42:32,624][core][INFO] - Step: 20000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:42:46,682][core][INFO] - Step: 22000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:43:01,168][core][INFO] - Step: 24000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:43:15,593][core][INFO] - Step: 26000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:43:29,945][core][INFO] - Step: 28000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:43:44,537][core][INFO] - Step: 30000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:43:58,921][core][INFO] - Step: 32000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:44:13,691][core][INFO] - Step: 34000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:44:28,577][core][INFO] - Step: 36000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:44:44,231][core][INFO] - Step: 38000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:44:59,385][core][INFO] - Step: 40000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:45:14,726][core][INFO] - Step: 42000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:45:31,078][core][INFO] - Step: 44000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:45:47,260][core][INFO] - Step: 46000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:46:01,959][core][INFO] - Step: 48000, Eval mean: 166.6, Eval std: 3.7735924528226414
[2025-10-13 22:46:18,821][core][INFO] - Step: 50000, Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:46:40,094][core][INFO] - Final Eval mean: 500.0, Eval std: 0.0
[2025-10-13 22:46:45,564][__main__][INFO] - Finish training with eval mean: 500.0

Binary file not shown.

Binary file not shown.

BIN
runs/DQN/results.png Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 77 KiB