"""Manual driver script for PartitionMazeEnv.

Resets the environment, then applies a fixed, hand-written sequence of
actions one step at a time, printing the state and reward returned by each
step and stopping early as soon as the environment reports ``done``.
"""
from env import PartitionMazeEnv
# Alternative environment module, kept for quick switching:
# from env_dis import PartitionMazeEnv

env = PartitionMazeEnv()
state = env.reset()
print(state)

# Scripted actions, one entry per environment step.
action_series = [[0.67], [0], [0], [0], [0.7]]
# Alternative action sequence (presumably for the env_dis variant -- confirm):
# action_series = [0, 0, 3, 0, 10]

# Iterate over the scripted actions directly rather than over a fixed
# range(100): indexing action_series with a counter raised IndexError as soon
# as the episode outlasted the scripted actions.
for action in action_series:
    # NOTE(review): the third value is treated as the termination flag; if
    # env.step follows the Gymnasium 5-tuple layout
    # (obs, reward, terminated, truncated, info), then `info` here actually
    # holds the `truncated` flag -- confirm against the env implementation.
    state, reward, done, info, _ = env.step(action)
    print(state)
    print(reward)
    if done:
        break