From 42d7ee2409c67d3703a8c9099ea2d843ea2ec934 Mon Sep 17 00:00:00 2001 From: Ariel_cr <58971000+cr-bh@users.noreply.github.com> Date: Tue, 21 Feb 2023 11:53:50 +0800 Subject: [PATCH] Update config.py --- joyrl/algos/TD3/config.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/joyrl/algos/TD3/config.py b/joyrl/algos/TD3/config.py index 6af1356..c8c7506 100644 --- a/joyrl/algos/TD3/config.py +++ b/joyrl/algos/TD3/config.py @@ -1,8 +1,8 @@ class AlgoConfig: def __init__(self) -> None: - self.explore_steps = 1000 # exploration steps before training + self.explore_steps = 100 # exploration steps before training self.policy_freq = 2 # policy update frequency - self.actor_lr = 1e-3 # actor learning rate 3e-4 + self.actor_lr = 1e-4 # actor learning rate 3e-4 self.critic_lr = 1e-3 # critic learning rate self.actor_hidden_dim = 256 # actor hidden layer dimension self.critic_hidden_dim = 256 # critic hidden layer dimension @@ -12,4 +12,4 @@ def __init__(self) -> None: self.expl_noise = 0.1 # std of Gaussian exploration noise self.noise_clip = 0.5 # range to clip target policy noise self.batch_size = 100 # batch size for both actor and critic - self.buffer_size = 1000000 # replay buffer size \ No newline at end of file + self.buffer_size = 1000000 # replay buffer size