ding.config.example.SAC.gym_pendulum_v1
ding.config.example.SAC.gym_pendulum_v1
¶
Full Source Code
../ding/config/example/SAC/gym_pendulum_v1.py
from easydict import EasyDict
import ding.envs.gym_env

# Example experiment configuration: SAC on the Pendulum-v1 gym environment.
# The nested mapping is wrapped in an EasyDict so entries can be read with
# attribute access (e.g. ``cfg.policy.learn.batch_size``).
cfg = EasyDict(
    {
        "exp_name": 'Pendulum-v1-SAC',
        "seed": 0,
        # Environment section.
        "env": {
            "env_id": 'Pendulum-v1',
            "collector_env_num": 10,
            "evaluator_env_num": 8,
            "n_evaluator_episode": 8,
            # NOTE(review): presumably the evaluation return at which
            # training is considered solved -- confirm against the runner.
            "stop_value": -250,
            "act_scale": True,
        },
        # Policy section: model, learning, collection, evaluation, buffer.
        "policy": {
            "cuda": True,
            "priority": False,
            "random_collect_size": 1000,
            "model": {
                "obs_shape": 3,
                "action_shape": 1,
                "twin_critic": True,
                "action_space": 'reparameterization',
                "actor_head_hidden_size": 128,
                "critic_head_hidden_size": 128,
            },
            "learn": {
                "update_per_collect": 1,
                "batch_size": 128,
                "learning_rate_q": 0.001,
                "learning_rate_policy": 0.001,
                "learning_rate_alpha": 0.0003,
                "ignore_done": True,
                "target_theta": 0.005,
                "discount_factor": 0.99,
                "auto_alpha": True,
            },
            "collect": {"n_sample": 10},
            "eval": {"evaluator": {"eval_freq": 100}},
            "other": {"replay_buffer": {"replay_buffer_size": 100000}},
        },
        # Weights & Biases logging switches.
        "wandb_logger": {
            "gradient_logger": True,
            "video_logger": True,
            "plot_logger": True,
            "action_logger": True,
            "return_logger": False,
        },
    }
)

# Environment entry point re-exported from ding's gym environment module.
env = ding.envs.gym_env.env