OpenDILabCommunity
/

Pendulum-v1-SAC

@@ -11,10 +11,11 @@ exp_config = {
             'cfg_type': 'BaseEnvManagerDict'
         },
         'stop_value': -250,
         'collector_env_num': 10,
         'evaluator_env_num': 8,
-        'act_scale': True,
-        'n_evaluator_episode': 8
     },
     'policy': {
         'model': {
@@ -67,9 +68,10 @@ exp_config = {
                     'render_freq': -1,
                     'mode': 'train_iter'
                 },
                 'cfg_type': 'InteractionSerialEvaluatorDict',
-                'n_episode': 8,
-                'stop_value': -250
             }
         },
         'other': {
@@ -78,7 +80,7 @@ exp_config = {
             }
         },
         'on_policy': False,
-        'cuda': False,
         'multi_gpu': False,
         'bp_update_sync': True,
         'traj_len_inf': False,

             'cfg_type': 'BaseEnvManagerDict'
         },
         'stop_value': -250,
+        'n_evaluator_episode': 8,
+        'env_id': 'Pendulum-v1',
         'collector_env_num': 10,
         'evaluator_env_num': 8,
+        'act_scale': True
     },
     'policy': {
         'model': {
                     'render_freq': -1,
                     'mode': 'train_iter'
                 },
+                'figure_path': None,
                 'cfg_type': 'InteractionSerialEvaluatorDict',
+                'stop_value': -250,
+                'n_episode': 8
             }
         },
         'other': {
             }
         },
         'on_policy': False,
+        'cuda': True,
         'multi_gpu': False,
         'bp_update_sync': True,
         'traj_len_inf': False,