26 lines
803 B
Python
26 lines
803 B
Python
# from env import PartitionMazeEnv
|
|
# from env_dis import PartitionMazeEnv
|
|
from env_partion_dist import PartitionEnv
|
|
|
|
# env = PartitionMazeEnv()
|
|
env = PartitionEnv()
|
|
|
|
state = env.reset()
|
|
print('state:', state)
|
|
|
|
# action_series = [[0.67], [0], [0], [0], [0.7]]
|
|
# action_series = [3, 3, 3, 5, 5, 1, 1, 1, 0, 0, 0]
|
|
# action_series = [1] * 30
|
|
# action_series = [[0.2], [0.4], [0.7], [0.5]]
|
|
# action_series = [[-0.08], [-0.08], [0], [0]]
|
|
action_series = [3, 5, 3, 5, 1, 1, 3, 5, 1, 5, 3, 1, 1, 1, 1, 1, 2, 1, 2, 1, 2, 1,
|
|
2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1]
|
|
|
|
for i in range(100):
|
|
action = action_series[i]
|
|
state, reward, done, _, info = env.step(action)
|
|
print('state:', state)
|
|
print('reward:', reward)
|
|
if done:
|
|
break
|