HPCC2025/human_action.py
weixin_46229132 84f69f4293 离散情况
2025-03-29 21:28:39 +08:00

24 lines
600 B
Python

# from env import PartitionMazeEnv
# from env_dis import PartitionMazeEnv
from env_partion_dist import PartitionEnv
# Manual smoke test: replay a fixed, hand-written action sequence through the
# environment and print the state and reward after every step.
# env = PartitionMazeEnv()
env = PartitionEnv()
state = env.reset()
print('state:', state)

# Alternative action sequences kept from earlier experiments (each action is
# a one-element list holding a float):
# action_series = [[0.67], [0], [0], [0], [0.7]]
# action_series = [[0.2], [0.4], [0.7], [0.5]]
# action_series = [[-0.08], [-0.08], [0], [0]]
action_series = [1] * 30

# Upper bound on the number of replayed steps.
max_steps = 100

# Iterate over the actions themselves rather than indexing with range(100):
# the sequence may be shorter than the step cap, and indexing past its end
# would raise IndexError when the episode has not finished by then.
for action in action_series[:max_steps]:
    # env.step returns five values here; the last one is not used.
    state, reward, done, info, _ = env.step(action)
    print('state:', state)
    print('reward:', reward)
    if done:
        break