# In [26]:
import gym
# Evaluate a fixed, hand-written policy on FrozenLake by running a batch of
# episodes and printing the total reward collected across all of them.
env = gym.make('FrozenLake-v0')

# One action per observation: the observation returned by the environment is
# used directly as an index into this list (see env.step(policy[obs]) below).
# The 16 entries are laid out here as four rows of four.
# NOTE(review): per the Gym FrozenLake documentation the action codes are
# 0=left, 1=down, 2=right, 3=up and states are numbered row-major on a 4x4
# map -- confirm against the installed gym version.
policy = [
    0, 2, 1, 0,
    0, 0, 1, 0,
    2, 2, 1, 0,
    0, 2, 2, 0,
]

num_episodes = 100  # number of independent rollouts to accumulate over
sum_reward = 0      # running total of every step reward over all episodes

for episode in range(num_episodes):
    obs = env.reset()
    done = False
    #print("episode: {}".format(episode))
    # Follow the policy until the environment reports the episode is over.
    while not done:
        obs, reward, done, info = env.step(policy[obs])
        sum_reward += reward
        #env.render()

# Report the accumulated reward once, after all episodes have finished.
print(sum_reward)
# In [ ]: