Skip to content

Commit 43cd551

Browse files
committed
Fixed per slot rec loss
1 parent 8369018 commit 43cd551

File tree

1,203 files changed

+83969
-12
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

1,203 files changed

+83969
-12
lines changed
Lines changed: 59 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,59 @@
1+
agent:
2+
_target_: rl_sandbox.agents.DreamerV2
3+
layer_norm: true
4+
batch_cluster_size: 50
5+
latent_dim: 16
6+
latent_classes: 16
7+
rssm_dim: 40
8+
slots_num: 8
9+
kl_loss_scale: 8.0
10+
kl_loss_balancing: 0.8
11+
kl_loss_free_nats: 0.0
12+
world_model_lr: 0.0003
13+
world_model_predict_discount: false
14+
discount_factor: 0.999
15+
imagination_horizon: 15
16+
actor_lr: 8.0e-05
17+
actor_reinforce_fraction: null
18+
actor_entropy_scale: 0.0001
19+
critic_lr: 8.0e-05
20+
critic_value_target_lambda: 0.95
21+
critic_update_interval: 100
22+
critic_soft_update_fraction: 1
23+
discrete_rssm: false
24+
decode_vit: false
25+
vit_l2_ratio: 1.0
26+
encode_vit: false
27+
env:
28+
_target_: rl_sandbox.utils.env.DmEnv
29+
domain_name: cartpole
30+
task_name: swingup
31+
run_on_pixels: true
32+
obs_res:
33+
- 64
34+
- 64
35+
camera_id: 0
36+
repeat_action_num: 2
37+
transforms: []
38+
training:
39+
steps: 1000000.0
40+
prefill: 1000
41+
batch_size: 16
42+
pretrain: 100
43+
prioritize_ends: false
44+
train_every: 5
45+
save_checkpoint_every: 2000000.0
46+
val_logs_every: 100.0
47+
checkpoint_path: null
48+
seed: 42
49+
device_type: cuda
50+
logger:
51+
type: null
52+
message: Cartpole 8 slots, reduced warmup, 192 n_dim, correct prev_slots, 8x KL,
53+
0 nats, 40 rssm dims, 16x16 stoch
54+
log_grads: false
55+
validation:
56+
rollout_num: 5
57+
visualize: true
58+
debug:
59+
profiler: false
Lines changed: 167 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,167 @@
1+
hydra:
2+
run:
3+
dir: outputs/${now:%Y-%m-%d}/${now:%H-%M-%S}
4+
sweep:
5+
dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6+
subdir: ${hydra.job.num}
7+
launcher:
8+
_target_: hydra_plugins.hydra_joblib_launcher.joblib_launcher.JoblibLauncher
9+
n_jobs: 1
10+
backend: null
11+
prefer: processes
12+
require: null
13+
verbose: 0
14+
timeout: null
15+
pre_dispatch: 2*n_jobs
16+
batch_size: auto
17+
temp_folder: null
18+
max_nbytes: null
19+
mmap_mode: r
20+
sweeper:
21+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
22+
max_batch_size: null
23+
params: null
24+
help:
25+
app_name: ${hydra.job.name}
26+
header: '${hydra.help.app_name} is powered by Hydra.
27+
28+
'
29+
footer: 'Powered by Hydra (https://hydra.cc)
30+
31+
Use --hydra-help to view Hydra specific help
32+
33+
'
34+
template: '${hydra.help.header}
35+
36+
== Configuration groups ==
37+
38+
Compose your configuration from those groups (group=option)
39+
40+
41+
$APP_CONFIG_GROUPS
42+
43+
44+
== Config ==
45+
46+
Override anything in the config (foo.bar=value)
47+
48+
49+
$CONFIG
50+
51+
52+
${hydra.help.footer}
53+
54+
'
55+
hydra_help:
56+
template: 'Hydra (${hydra.runtime.version})
57+
58+
See https://hydra.cc for more info.
59+
60+
61+
== Flags ==
62+
63+
$FLAGS_HELP
64+
65+
66+
== Configuration groups ==
67+
68+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
69+
to command line)
70+
71+
72+
$HYDRA_CONFIG_GROUPS
73+
74+
75+
Use ''--cfg hydra'' to Show the Hydra config.
76+
77+
'
78+
hydra_help: ???
79+
hydra_logging:
80+
version: 1
81+
formatters:
82+
simple:
83+
format: '[%(asctime)s][HYDRA] %(message)s'
84+
handlers:
85+
console:
86+
class: logging.StreamHandler
87+
formatter: simple
88+
stream: ext://sys.stdout
89+
root:
90+
level: INFO
91+
handlers:
92+
- console
93+
loggers:
94+
logging_example:
95+
level: DEBUG
96+
disable_existing_loggers: false
97+
job_logging:
98+
version: 1
99+
formatters:
100+
simple:
101+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
102+
handlers:
103+
console:
104+
class: logging.StreamHandler
105+
formatter: simple
106+
stream: ext://sys.stdout
107+
file:
108+
class: logging.FileHandler
109+
formatter: simple
110+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
111+
root:
112+
level: INFO
113+
handlers:
114+
- console
115+
- file
116+
disable_existing_loggers: false
117+
env: {}
118+
mode: RUN
119+
searchpath: []
120+
callbacks: {}
121+
output_subdir: .hydra
122+
overrides:
123+
hydra: []
124+
task: []
125+
job:
126+
name: train
127+
chdir: null
128+
override_dirname: ''
129+
id: ???
130+
num: ???
131+
config_name: config
132+
env_set: {}
133+
env_copy: []
134+
config:
135+
override_dirname:
136+
kv_sep: '='
137+
item_sep: ','
138+
exclude_keys: []
139+
runtime:
140+
version: 1.2.0
141+
version_base: '1.2'
142+
cwd: /jmain02/home/J2AD019/exk13/rrm37-exk13/rl_sandbox
143+
config_sources:
144+
- path: hydra.conf
145+
schema: pkg
146+
provider: hydra
147+
- path: /jmain02/home/J2AD019/exk13/rrm37-exk13/rl_sandbox/rl_sandbox/config
148+
schema: file
149+
provider: main
150+
- path: ''
151+
schema: structured
152+
provider: schema
153+
output_dir: /jmain02/home/J2AD019/exk13/rrm37-exk13/rl_sandbox/outputs/2023-04-23/19-25-50
154+
choices:
155+
training: dm
156+
env: dm_cartpole
157+
agent: dreamer_v2
158+
hydra/env: default
159+
hydra/callbacks: null
160+
hydra/job_logging: default
161+
hydra/hydra_logging: default
162+
hydra/hydra_help: default
163+
hydra/help: default
164+
hydra/sweeper: basic
165+
hydra/launcher: joblib
166+
hydra/output: default
167+
verbose: false
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
[]

outputs/2023-04-23/19-25-50/train.log

Whitespace-only changes.
Lines changed: 59 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,59 @@
1+
agent:
2+
_target_: rl_sandbox.agents.DreamerV2
3+
layer_norm: true
4+
batch_cluster_size: 50
5+
latent_dim: 16
6+
latent_classes: 16
7+
rssm_dim: 40
8+
slots_num: 8
9+
kl_loss_scale: 8.0
10+
kl_loss_balancing: 0.8
11+
kl_loss_free_nats: 0.0
12+
world_model_lr: 0.0003
13+
world_model_predict_discount: false
14+
discount_factor: 0.999
15+
imagination_horizon: 15
16+
actor_lr: 8.0e-05
17+
actor_reinforce_fraction: null
18+
actor_entropy_scale: 0.0001
19+
critic_lr: 8.0e-05
20+
critic_value_target_lambda: 0.95
21+
critic_update_interval: 100
22+
critic_soft_update_fraction: 1
23+
discrete_rssm: false
24+
decode_vit: false
25+
vit_l2_ratio: 1.0
26+
encode_vit: false
27+
env:
28+
_target_: rl_sandbox.utils.env.DmEnv
29+
domain_name: cartpole
30+
task_name: swingup
31+
run_on_pixels: true
32+
obs_res:
33+
- 64
34+
- 64
35+
camera_id: 0
36+
repeat_action_num: 2
37+
transforms: []
38+
training:
39+
steps: 1000000.0
40+
prefill: 1000
41+
batch_size: 16
42+
pretrain: 100
43+
prioritize_ends: false
44+
train_every: 5
45+
save_checkpoint_every: 2000000.0
46+
val_logs_every: 100.0
47+
checkpoint_path: null
48+
seed: 42
49+
device_type: cuda
50+
logger:
51+
type: null
52+
message: Cartpole 8 slots, reduced warmup, 384 n_dim, correct prev_slots, 8x KL,
53+
0 nats, 40 rssm dims, 16x16 stoch
54+
log_grads: false
55+
validation:
56+
rollout_num: 5
57+
visualize: true
58+
debug:
59+
profiler: false

0 commit comments

Comments
 (0)