DQN让它先看答案

2025-03-20 14:05:15 +08:00 · 2025-03-20 14:05:15 +08:00 · 67c7a9d6c7
commit 67c7a9d6c7
parent f4fb963c06
2 changed files with 7 additions and 5 deletions
--- a/Duel_Double_DQN/main.py
+++ b/Duel_Double_DQN/main.py
@@ -123,10 +123,12 @@ def main():
            while not done:
                # e-greedy exploration
                if total_steps < opt.random_steps:
-                    if s[0] == 0:
-                        a = np.random.randint(0, 10)
-                    else:
-                        a = np.random.randint(10, 14)
+                    # if s[0] == 0:
+                    #     a = np.random.randint(0, 10)
+                    # else:
+                    #     a = np.random.randint(10, 14)
+                    action_series = [0, 0, 3, 0, 10]
+                    a = action_series[total_steps % 5]
                else:
                    a = agent.select_action(s, deterministic=False)
                s_next, r, dw, tr, info = env.step(a)
--- a/env_dis.py
+++ b/env_dis.py
@@ -275,7 +275,7 @@ class PartitionMazeEnv(gym.Env):
                # print(self.partition_values)
                # print(self.car_traj)
                reward += self.BASE_LINE / T * 1000
-                print(reward)
+                # print(reward)
            elif done and self.step_count >= self.MAX_STEPS:
                reward += -1000