From db890f83cf8272abc066eef67e4ffbfeacd9a65a Mon Sep 17 00:00:00 2001 From: weixin_46229132 Date: Fri, 14 Mar 2025 09:22:40 +0800 Subject: [PATCH] =?UTF-8?q?=E6=94=B9=E7=BD=91=E7=BB=9C=E7=9A=84=E6=BF=80?= =?UTF-8?q?=E6=B4=BB=E5=87=BD=E6=95=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- PPO2/PPO.py | 20 ++++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/PPO2/PPO.py b/PPO2/PPO.py index c071b9b..286203d 100644 --- a/PPO2/PPO.py +++ b/PPO2/PPO.py @@ -48,17 +48,17 @@ class ActorCritic(nn.Module): if has_continuous_action_space : self.actor = nn.Sequential( nn.Linear(state_dim, 64), - nn.Tanh(), + # nn.Tanh(), # nn.Sigmoid(), - # nn.ReLU(), + nn.ReLU(), nn.Linear(64, 64), - nn.Tanh(), + # nn.Tanh(), # nn.Sigmoid(), - # nn.ReLU(), + nn.ReLU(), nn.Linear(64, action_dim), - nn.Tanh() + # nn.Tanh() # nn.Sigmoid() - # nn.ReLU() + nn.ReLU() ) else: self.actor = nn.Sequential( @@ -72,13 +72,13 @@ class ActorCritic(nn.Module): # critic self.critic = nn.Sequential( nn.Linear(state_dim, 64), - nn.Tanh(), + # nn.Tanh(), # nn.Sigmoid(), - # nn.ReLU(), + nn.ReLU(), nn.Linear(64, 64), - nn.Tanh(), + # nn.Tanh(), # nn.Sigmoid(), - # nn.ReLU(), + nn.ReLU(), nn.Linear(64, 1) )