# from env import PartitionMazeEnv
from env_dis import PartitionMazeEnv

# Manual smoke test: reset the environment, then replay a fixed list of
# actions, printing the state and reward after every step.
env = PartitionMazeEnv()

state = env.reset()
print(state)

# Upper bound on the number of steps taken in one rollout.
MAX_STEPS = 100

# Alternative action list kept for reference (list-wrapped float actions;
# presumably for the continuous env from `env` -- TODO confirm):
# action_series = [[0], [0], [0.4], [0], [0.1]]
action_series = [0, 0, 3, 0, 10]

# Iterate over the actions themselves rather than over range(100): indexing
# action_series[i] raised IndexError as soon as the episode outlasted the
# scripted actions. The slice keeps the original 100-step cap.
for action in action_series[:MAX_STEPS]:
    # NOTE(review): step() is unpacked as a 5-tuple. If the env follows the
    # Gymnasium convention (obs, reward, terminated, truncated, info), then
    # `info` here actually receives `truncated` -- confirm against env_dis.
    state, reward, done, info, _ = env.step(action)
    print(state)
    print(reward)
    if done:
        break