HPCC2025/human_action.py

19 lines
380 B
Python
Raw Normal View History

2025-03-19 20:40:35 +08:00
# Manual smoke test: replay a fixed, hand-written action sequence against
# PartitionMazeEnv and print the state and reward after every step.

# Alternative environment module, kept for reference:
# from env import PartitionMazeEnv
from env_dis import PartitionMazeEnv

env = PartitionMazeEnv()
state = env.reset()
print(state)

# Earlier action sequence written as nested float lists, kept for reference:
# action_series = [[0], [0], [0.4], [0], [0.1]]
action_series = [0, 0, 3, 0, 10]

# Iterate over the scripted actions directly. The previous version indexed
# action_series with range(100), which raised IndexError on the sixth
# iteration whenever the episode had not finished within the five scripted
# actions.
for action in action_series:
    # NOTE(review): step() is unpacked into five values with the names used
    # by the original script; confirm the order against
    # PartitionMazeEnv.step (the fifth value is discarded).
    state, reward, done, info, _ = env.step(action)
    print(state)
    print(reward)
    if done:
        break