==== CONFIG ==== cache_dir: null solver: _target_: stable_worldmodel.solver.CEMSolver model: ??? batch_size: 1 num_samples: 300 var_scale: 1.0 n_steps: 30 topk: 30 device: cuda seed: ${seed} world: env_name: swm/TwoRoom-v1 num_envs: ${eval.num_eval} max_episode_steps: 100 history_size: 1 frame_skip: 1 seed: 42 policy: two-room/tworoom/lejepa dataset: stats: ${eval.dataset_name} keys_to_cache: - action - proprio plan_config: horizon: 5 receding_horizon: 5 action_block: 5 eval: num_eval: 50 goal_offset_steps: 25 eval_budget: 50 img_size: 224 dataset_name: tworoom callables: - method: _set_state args: state: value: proprio - method: _set_goal_state args: goal_state: value: goal_proprio output: filename: tworoom_results.txt ==== RESULTS ==== metrics: {'success_rate': 88.0, 'episode_successes': array([ True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True]), 'seeds': None} evaluation_time: 133.1857841014862 seconds inference_precision: fp32 ==== CONFIG ==== cache_dir: null solver: _target_: stable_worldmodel.solver.CEMSolver model: ??? batch_size: 1 num_samples: 300 var_scale: 1.0 n_steps: 30 topk: 30 device: cuda seed: ${seed} world: env_name: swm/TwoRoom-v1 num_envs: ${eval.num_eval} max_episode_steps: 100 history_size: 1 frame_skip: 1 seed: 42 policy: two-room/tworoom/lejepa dataset: stats: ${eval.dataset_name} keys_to_cache: - action - proprio plan_config: horizon: 5 receding_horizon: 5 action_block: 5 eval: num_eval: 50 goal_offset_steps: 25 eval_budget: 50 img_size: 224 dataset_name: tworoom callables: - method: _set_state args: state: value: proprio - method: _set_goal_state args: goal_state: value: goal_proprio output: filename: tworoom_results.txt ==== RESULTS ==== metrics: {'success_rate': 88.0, 'episode_successes': array([ True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True]), 'seeds': None} evaluation_time: 131.6325900554657 seconds inference_precision: fp32 ==== CONFIG ==== cache_dir: null solver: _target_: stable_worldmodel.solver.CEMSolver model: ??? batch_size: 1 num_samples: 300 var_scale: 1.0 n_steps: 30 topk: 30 device: cuda seed: ${seed} world: env_name: swm/TwoRoom-v1 num_envs: ${eval.num_eval} max_episode_steps: 100 history_size: 1 frame_skip: 1 seed: 42 policy: two-room/tworoom/lejepa dataset: stats: ${eval.dataset_name} keys_to_cache: - action - proprio plan_config: horizon: 5 receding_horizon: 5 action_block: 5 eval: num_eval: 50 goal_offset_steps: 25 eval_budget: 50 img_size: 224 dataset_name: tworoom callables: - method: _set_state args: state: value: proprio - method: _set_goal_state args: goal_state: value: goal_proprio output: filename: tworoom_results.txt ==== RESULTS ==== metrics: {'success_rate': 88.0, 'episode_successes': array([ True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True]), 'seeds': None} evaluation_time: 119.98270344734192 seconds inference_precision: fp32 ==== CONFIG ==== cache_dir: null solver: _target_: stable_worldmodel.solver.CEMSolver model: ??? batch_size: 1 num_samples: 300 var_scale: 1.0 n_steps: 30 topk: 30 device: cuda seed: ${seed} world: env_name: swm/TwoRoom-v1 num_envs: ${eval.num_eval} max_episode_steps: 100 history_size: 1 frame_skip: 1 seed: 42 policy: two-room/tworoom/lejepa dataset: stats: ${eval.dataset_name} keys_to_cache: - action - proprio plan_config: horizon: 5 receding_horizon: 5 action_block: 5 eval: num_eval: 50 goal_offset_steps: 25 eval_budget: 50 img_size: 224 dataset_name: tworoom callables: - method: _set_state args: state: value: proprio - method: _set_goal_state args: goal_state: value: goal_proprio output: filename: tworoom_results.txt ==== RESULTS ==== metrics: {'success_rate': 88.0, 'episode_successes': array([ True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True]), 'seeds': None} evaluation_time: 121.47896695137024 seconds inference_precision: fp32 ==== CONFIG ==== cache_dir: null solver: _target_: stable_worldmodel.solver.CEMSolver model: ??? batch_size: 1 num_samples: 300 var_scale: 1.0 n_steps: 30 topk: 30 device: cuda seed: ${seed} world: env_name: swm/TwoRoom-v1 num_envs: ${eval.num_eval} max_episode_steps: 100 history_size: 1 frame_skip: 1 seed: 42 policy: two-room/tworoom/lejepa inference_precision: bf16 dataset: stats: ${eval.dataset_name} keys_to_cache: - action - proprio plan_config: horizon: 5 receding_horizon: 5 action_block: 5 eval: num_eval: 50 goal_offset_steps: 25 eval_budget: 50 img_size: 224 dataset_name: tworoom callables: - method: _set_state args: state: value: proprio - method: _set_goal_state args: goal_state: value: goal_proprio output: filename: tworoom_results.txt ==== RESULTS ==== metrics: {'success_rate': 84.0, 'episode_successes': array([ True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, False, True, True, True, False, True, True, False, False, True, True, True, True, True, True, True, True, True, True]), 'seeds': None} evaluation_time: 97.36299586296082 seconds inference_precision: bf16 ==== CONFIG ==== cache_dir: null solver: _target_: stable_worldmodel.solver.CEMSolver model: ??? batch_size: 1 num_samples: 300 var_scale: 1.0 n_steps: 30 topk: 30 device: cuda seed: ${seed} world: env_name: swm/TwoRoom-v1 num_envs: ${eval.num_eval} max_episode_steps: 100 history_size: 1 frame_skip: 1 seed: 42 policy: two-room/tworoom/lejepa inference_precision: fp16 dataset: stats: ${eval.dataset_name} keys_to_cache: - action - proprio plan_config: horizon: 5 receding_horizon: 5 action_block: 5 eval: num_eval: 50 goal_offset_steps: 25 eval_budget: 50 img_size: 224 dataset_name: tworoom callables: - method: _set_state args: state: value: proprio - method: _set_goal_state args: goal_state: value: goal_proprio output: filename: tworoom_results.txt ==== RESULTS ==== metrics: {'success_rate': 90.0, 'episode_successes': array([ True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True]), 'seeds': None} evaluation_time: 94.01083040237427 seconds inference_precision: fp16 ==== CONFIG ==== cache_dir: null solver: _target_: stable_worldmodel.solver.CEMSolver model: ??? batch_size: 1 num_samples: 300 var_scale: 1.0 n_steps: 30 topk: 30 device: cuda seed: ${seed} world: env_name: swm/TwoRoom-v1 num_envs: ${eval.num_eval} max_episode_steps: 100 history_size: 1 frame_skip: 1 seed: 42 policy: two-room/tworoom/lejepa inference_precision: fp16 dataset: stats: ${eval.dataset_name} keys_to_cache: - action - proprio plan_config: horizon: 5 receding_horizon: 5 action_block: 5 eval: num_eval: 50 goal_offset_steps: 25 eval_budget: 50 img_size: 224 dataset_name: tworoom callables: - method: _set_state args: state: value: proprio - method: _set_goal_state args: goal_state: value: goal_proprio output: filename: tworoom_results.txt ==== RESULTS ==== metrics: {'success_rate': 90.0, 'episode_successes': array([ True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True]), 'seeds': None} evaluation_time: 89.50024104118347 seconds inference_precision: fp16 ==== CONFIG ==== cache_dir: null solver: _target_: stable_worldmodel.solver.CEMSolver model: ??? batch_size: 1 num_samples: 300 var_scale: 1.0 n_steps: 30 topk: 30 device: cuda seed: ${seed} world: env_name: swm/TwoRoom-v1 num_envs: ${eval.num_eval} max_episode_steps: 100 history_size: 1 frame_skip: 1 seed: 42 policy: two-room/tworoom/lejepa inference_precision: fp16 dataset: stats: ${eval.dataset_name} keys_to_cache: - action - proprio plan_config: horizon: 5 receding_horizon: 5 action_block: 5 eval: num_eval: 50 goal_offset_steps: 25 eval_budget: 50 img_size: 224 dataset_name: tworoom callables: - method: _set_state args: state: value: proprio - method: _set_goal_state args: goal_state: value: goal_proprio output: filename: tworoom_results.txt ==== RESULTS ==== metrics: {'success_rate': 90.0, 'episode_successes': array([ True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True]), 'seeds': None} evaluation_time: 86.20240807533264 seconds inference_precision: fp16