HPCC2025/human_action.py

24 lines
617 B
Python
Raw Normal View History

2025-03-28 21:37:31 +08:00
# from env import PartitionMazeEnv
2025-03-22 09:47:52 +08:00
# from env_dis import PartitionMazeEnv
2025-03-29 21:28:39 +08:00
from env_partion_dist import PartitionEnv
2025-03-14 09:42:56 +08:00
2025-03-28 21:37:31 +08:00
# Manual rollout: replay a hand-written action sequence through the
# environment and print the state and reward after every step.

# env = PartitionMazeEnv()
env = PartitionEnv()
state = env.reset()
print('state:', state)

# Scripted actions, consumed one per environment step. The commented-out
# alternatives are earlier hand-written sequences kept for reference.
# action_series = [[0.67], [0], [0], [0], [0.7]]
action_series = [3, 3, 3, 5, 5, 1, 1, 1, 0, 0, 0]
# action_series = [1] * 30
# action_series = [[0.2], [0.4], [0.7], [0.5]]
# action_series = [[-0.08], [-0.08], [0], [0]]

# Upper bound on the number of steps taken, regardless of how many actions
# are scripted.
MAX_STEPS = 100

# Iterate over the scripted actions directly instead of indexing with
# range(100): the list is shorter than 100 entries, so indexing raised
# IndexError whenever the episode outlived the script.
for action in action_series[:MAX_STEPS]:
    # NOTE(review): step() is unpacked into five values; if PartitionEnv
    # follows the Gymnasium convention (obs, reward, terminated, truncated,
    # info), then `info` here actually holds the truncation flag - confirm
    # against the environment implementation.
    state, reward, done, info, _ = env.step(action)
    print('state:', state)
    print('reward:', reward)
    if done:
        break
else:
    # Reached only when the loop was never broken out of, i.e. the
    # environment did not report `done` for any scripted action.
    print('action series exhausted before the episode finished')