diff --git a/env.py b/env.py index b1b84cc..6765df9 100644 --- a/env.py +++ b/env.py @@ -40,7 +40,7 @@ class PartitionMazeEnv(gym.Env): # 可能需要手动修改的超参数 ############################## self.CUT_NUM = 4 # 横切一半,竖切一半 - self.BASE_LINE = 3500 # 基准时间,通过greedy或者蒙特卡洛计算出来 + self.BASE_LINE = 4000 # 基准时间,通过greedy或者蒙特卡洛计算出来 self.MAX_STEPS = 50 # 迷宫走法步数上限 self.phase = 0 # 阶段控制,0:区域划分阶段,1:迷宫初始化阶段,2:走迷宫阶段 diff --git a/env_dis.py b/env_dis.py index 91ac312..9c7e811 100644 --- a/env_dis.py +++ b/env_dis.py @@ -275,6 +275,7 @@ class PartitionMazeEnv(gym.Env): # print(self.partition_values) # print(self.car_traj) reward += self.BASE_LINE / T * 1000 + print(reward) elif done and self.step_count >= self.MAX_STEPS: reward += -1000