2025-03-14 09:42:56 +08:00
|
|
|
from env import PartitionMazeEnv
|
|
|
|
|
|
|
|
# Create the environment with its default constructor arguments.
env = PartitionMazeEnv()

# Reset once and show whatever the environment hands back as its first state.
state = env.reset()
print(state)
|
|
|
|
|
2025-03-14 11:17:12 +08:00
|
|
|
# Scripted actions for the rollout; each one is wrapped in its own
# single-element list because that is the form passed to env.step().
action_series = [[value] for value in (0, 0.3, 0, 0, 0.1, 0.7)]
|
2025-03-14 09:42:56 +08:00
|
|
|
|
|
|
|
# Replay the scripted actions one environment step at a time, printing the
# result of every step and stopping as soon as the episode reports done.
#
# The loop walks the actions themselves instead of indexing with range(10):
# the script defines fewer than ten actions, so the indexed form raised
# IndexError whenever the episode outlasted the script. The [:10] slice keeps
# the original cap of at most ten steps should the action list grow.
for action in action_series[:10]:
    # NOTE(review): five values are unpacked and the last is discarded. If
    # PartitionMazeEnv follows the Gymnasium step() convention
    # (obs, reward, terminated, truncated, info), then `info` here actually
    # holds the `truncated` flag -- confirm against the env implementation.
    state, reward, done, info, _ = env.step(action)
    print(state, reward, done, info)
    if done:
        break
|