OpenDILabCommunity
/

HalfCheetah-v3-SAC

@@ -11,16 +11,11 @@ exp_config = {
             'cfg_type': 'BaseEnvManagerDict'
         },
         'stop_value': 12000,
         'env_id': 'HalfCheetah-v3',
-        'norm_obs': {
-            'use_norm': False
-        },
-        'norm_reward': {
-            'use_norm': False
-        },
         'collector_env_num': 1,
         'evaluator_env_num': 8,
-        'n_evaluator_episode': 8
     },
     'policy': {
         'model': {
@@ -74,9 +69,10 @@ exp_config = {
                     'render_freq': -1,
                     'mode': 'train_iter'
                 },
                 'cfg_type': 'InteractionSerialEvaluatorDict',
-                'n_episode': 8,
-                'stop_value': 12000
             }
         },
         'other': {
@@ -85,7 +81,7 @@ exp_config = {
             }
         },
         'on_policy': False,
-        'cuda': False,
         'multi_gpu': False,
         'bp_update_sync': True,
         'traj_len_inf': False,

             'cfg_type': 'BaseEnvManagerDict'
         },
         'stop_value': 12000,
+        'n_evaluator_episode': 8,
         'env_id': 'HalfCheetah-v3',
         'collector_env_num': 1,
         'evaluator_env_num': 8,
+        'env_wrapper': 'mujoco_default'
     },
     'policy': {
         'model': {
                     'render_freq': -1,
                     'mode': 'train_iter'
                 },
+                'figure_path': None,
                 'cfg_type': 'InteractionSerialEvaluatorDict',
+                'stop_value': 12000,
+                'n_episode': 8
             }
         },
         'other': {
             }
         },
         'on_policy': False,
+        'cuda': True,
         'multi_gpu': False,
         'bp_update_sync': True,
         'traj_len_inf': False,