Adjust TD3 default hyperparameters in AlgoConfig:
  * explore_steps: 1000 -> 100
  * actor_lr:      1e-3 -> 1e-4
  * buffer_size line is unchanged in value; the hunk only adds the missing
    trailing newline at the end of config.py.

NOTE(review): this patch was recovered from a copy whose line breaks and
leading whitespace had been collapsed. Indentation inside the hunks is
reconstructed as standard 4-space Python indentation -- verify the context
lines against the target file before applying.

diff --git a/joyrl/algos/TD3/config.py b/joyrl/algos/TD3/config.py
index 6af1356..c8c7506 100644
--- a/joyrl/algos/TD3/config.py
+++ b/joyrl/algos/TD3/config.py
@@ -1,8 +1,8 @@
 class AlgoConfig:
     def __init__(self) -> None:
-        self.explore_steps = 1000 # exploration steps before training
+        self.explore_steps = 100 # exploration steps before training
         self.policy_freq = 2 # policy update frequency
-        self.actor_lr = 1e-3 # actor learning rate 3e-4
+        self.actor_lr = 1e-4 # actor learning rate 3e-4
         self.critic_lr = 1e-3 # critic learning rate
         self.actor_hidden_dim = 256 # actor hidden layer dimension
         self.critic_hidden_dim = 256 # critic hidden layer dimension
@@ -12,4 +12,4 @@ def __init__(self) -> None:
         self.expl_noise = 0.1 # std of Gaussian exploration noise
         self.noise_clip = 0.5 # range to clip target policy noise
         self.batch_size = 100 # batch size for both actor and critic
-        self.buffer_size = 1000000 # replay buffer size
\ No newline at end of file
+        self.buffer_size = 1000000 # replay buffer size