Midren
diff --git a/‎outputs/2023-04-23/19-25-50/.hydra/config.yaml‎
Lines changed: 59 additions & 0 deletions b/‎outputs/2023-04-23/19-25-50/.hydra/config.yaml‎
Lines changed: 59 additions & 0 deletions
diff --git a/‎outputs/2023-04-23/19-25-50/.hydra/hydra.yaml‎
Lines changed: 167 additions & 0 deletions b/‎outputs/2023-04-23/19-25-50/.hydra/hydra.yaml‎
Lines changed: 167 additions & 0 deletions
diff --git a/‎outputs/2023-04-23/19-25-50/.hydra/overrides.yaml‎
Lines changed: 1 addition & 0 deletions b/‎outputs/2023-04-23/19-25-50/.hydra/overrides.yaml‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎outputs/2023-04-23/19-25-50/train.log‎ b/‎outputs/2023-04-23/19-25-50/train.log‎
diff --git a/‎outputs/2023-04-23/19-29-44/.hydra/config.yaml‎
Lines changed: 59 additions & 0 deletions b/‎outputs/2023-04-23/19-29-44/.hydra/config.yaml‎
Lines changed: 59 additions & 0 deletions
@@ -0,0 +1,59 @@
+agent:
+  _target_: rl_sandbox.agents.DreamerV2
+  layer_norm: true
+  batch_cluster_size: 50
+  latent_dim: 16
+  latent_classes: 16
+  rssm_dim: 40
+  slots_num: 8
+  kl_loss_scale: 8.0
+  kl_loss_balancing: 0.8
+  kl_loss_free_nats: 0.0
+  world_model_lr: 0.0003
+  world_model_predict_discount: false
+  discount_factor: 0.999
+  imagination_horizon: 15
+  actor_lr: 8.0e-05
+  actor_reinforce_fraction: null
+  actor_entropy_scale: 0.0001
+  critic_lr: 8.0e-05
+  critic_value_target_lambda: 0.95
+  critic_update_interval: 100
+  critic_soft_update_fraction: 1
+  discrete_rssm: false
+  decode_vit: false
+  vit_l2_ratio: 1.0
+  encode_vit: false
+env:
+  _target_: rl_sandbox.utils.env.DmEnv
+  domain_name: cartpole
+  task_name: swingup
+  run_on_pixels: true
+  obs_res:
+  - 64
+  - 64
+  camera_id: 0
+  repeat_action_num: 2
+  transforms: []
+training:
+  steps: 1000000.0
+  prefill: 1000
+  batch_size: 16
+  pretrain: 100
+  prioritize_ends: false
+  train_every: 5
+  save_checkpoint_every: 2000000.0
+  val_logs_every: 100.0
+  checkpoint_path: null
+seed: 42
+device_type: cuda
+logger:
+  type: null
+  message: Cartpole 8 slots, reduced warmup, 192 n_dim, correct prev_slots, 8x KL,
+    0 nats, 40 rssm dims, 16x16 stoch
+  log_grads: false
+validation:
+  rollout_num: 5
+  visualize: true
+debug:
+  profiler: false
@@ -0,0 +1,167 @@
+hydra:
+  run:
+    dir: outputs/${now:%Y-%m-%d}/${now:%H-%M-%S}
+  sweep:
+    dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
+    subdir: ${hydra.job.num}
+  launcher:
+    _target_: hydra_plugins.hydra_joblib_launcher.joblib_launcher.JoblibLauncher
+    n_jobs: 1
+    backend: null
+    prefer: processes
+    require: null
+    verbose: 0
+    timeout: null
+    pre_dispatch: 2*n_jobs
+    batch_size: auto
+    temp_folder: null
+    max_nbytes: null
+    mmap_mode: r
+  sweeper:
+    _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
+    max_batch_size: null
+    params: null
+  help:
+    app_name: ${hydra.job.name}
+    header: '${hydra.help.app_name} is powered by Hydra.
+
+      '
+    footer: 'Powered by Hydra (https://hydra.cc)
+
+      Use --hydra-help to view Hydra specific help
+
+      '
+    template: '${hydra.help.header}
+
+      == Configuration groups ==
+
+      Compose your configuration from those groups (group=option)
+
+
+      $APP_CONFIG_GROUPS
+
+
+      == Config ==
+
+      Override anything in the config (foo.bar=value)
+
+
+      $CONFIG
+
+
+      ${hydra.help.footer}
+
+      '
+  hydra_help:
+    template: 'Hydra (${hydra.runtime.version})
+
+      See https://hydra.cc for more info.
+
+
+      == Flags ==
+
+      $FLAGS_HELP
+
+
+      == Configuration groups ==
+
+      Compose your configuration from those groups (For example, append hydra/job_logging=disabled
+      to command line)
+
+
+      $HYDRA_CONFIG_GROUPS
+
+
+      Use ''--cfg hydra'' to Show the Hydra config.
+
+      '
+    hydra_help: ???
+  hydra_logging:
+    version: 1
+    formatters:
+      simple:
+        format: '[%(asctime)s][HYDRA] %(message)s'
+    handlers:
+      console:
+        class: logging.StreamHandler
+        formatter: simple
+        stream: ext://sys.stdout
+    root:
+      level: INFO
+      handlers:
+      - console
+    loggers:
+      logging_example:
+        level: DEBUG
+    disable_existing_loggers: false
+  job_logging:
+    version: 1
+    formatters:
+      simple:
+        format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
+    handlers:
+      console:
+        class: logging.StreamHandler
+        formatter: simple
+        stream: ext://sys.stdout
+      file:
+        class: logging.FileHandler
+        formatter: simple
+        filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
+    root:
+      level: INFO
+      handlers:
+      - console
+      - file
+    disable_existing_loggers: false
+  env: {}
+  mode: RUN
+  searchpath: []
+  callbacks: {}
+  output_subdir: .hydra
+  overrides:
+    hydra: []
+    task: []
+  job:
+    name: train
+    chdir: null
+    override_dirname: ''
+    id: ???
+    num: ???
+    config_name: config
+    env_set: {}
+    env_copy: []
+    config:
+      override_dirname:
+        kv_sep: '='
+        item_sep: ','
+        exclude_keys: []
+  runtime:
+    version: 1.2.0
+    version_base: '1.2'
+    cwd: /jmain02/home/J2AD019/exk13/rrm37-exk13/rl_sandbox
+    config_sources:
+    - path: hydra.conf
+      schema: pkg
+      provider: hydra
+    - path: /jmain02/home/J2AD019/exk13/rrm37-exk13/rl_sandbox/rl_sandbox/config
+      schema: file
+      provider: main
+    - path: ''
+      schema: structured
+      provider: schema
+    output_dir: /jmain02/home/J2AD019/exk13/rrm37-exk13/rl_sandbox/outputs/2023-04-23/19-25-50
+    choices:
+      training: dm
+      env: dm_cartpole
+      agent: dreamer_v2
+      hydra/env: default
+      hydra/callbacks: null
+      hydra/job_logging: default
+      hydra/hydra_logging: default
+      hydra/hydra_help: default
+      hydra/help: default
+      hydra/sweeper: basic
+      hydra/launcher: joblib
+      hydra/output: default
+  verbose: false
@@ -0,0 +1 @@
+[]
@@ -0,0 +1,59 @@
+agent:
+  _target_: rl_sandbox.agents.DreamerV2
+  layer_norm: true
+  batch_cluster_size: 50
+  latent_dim: 16
+  latent_classes: 16
+  rssm_dim: 40
+  slots_num: 8
+  kl_loss_scale: 8.0
+  kl_loss_balancing: 0.8
+  kl_loss_free_nats: 0.0
+  world_model_lr: 0.0003
+  world_model_predict_discount: false
+  discount_factor: 0.999
+  imagination_horizon: 15
+  actor_lr: 8.0e-05
+  actor_reinforce_fraction: null
+  actor_entropy_scale: 0.0001
+  critic_lr: 8.0e-05
+  critic_value_target_lambda: 0.95
+  critic_update_interval: 100
+  critic_soft_update_fraction: 1
+  discrete_rssm: false
+  decode_vit: false
+  vit_l2_ratio: 1.0
+  encode_vit: false
+env:
+  _target_: rl_sandbox.utils.env.DmEnv
+  domain_name: cartpole
+  task_name: swingup
+  run_on_pixels: true
+  obs_res:
+  - 64
+  - 64
+  camera_id: 0
+  repeat_action_num: 2
+  transforms: []
+training:
+  steps: 1000000.0
+  prefill: 1000
+  batch_size: 16
+  pretrain: 100
+  prioritize_ends: false
+  train_every: 5
+  save_checkpoint_every: 2000000.0
+  val_logs_every: 100.0
+  checkpoint_path: null
+seed: 42
+device_type: cuda
+logger:
+  type: null
+  message: Cartpole 8 slots, reduced warmup, 384 n_dim, correct prev_slots, 8x KL,
+    0 nats, 40 rssm dims, 16x16 stoch
+  log_grads: false
+validation:
+  rollout_num: 5
+  visualize: true
+debug:
+  profiler: false