In [1]:
from MonteCarloControl import MonteCarloControl
import pickle
from TDControl import Sarsa
from Utility import Plot2D
import numpy as np
In [2]:
# Run Monte Carlo control and persist the resulting `q` attribute so that
# later cells can reload it from disk instead of recomputing it.
# NOTE(review): the meaning of the two solve() arguments is defined in
# MonteCarloControl.solve — presumably an episode count and a constant used
# by the solver; confirm there.
mc = MonteCarloControl()
mc.solve(10 ** 7, 100)  # 10 ** 7 == 10000000

# Binary mode is required for pickle streams.
with open("q_star_100.obj", "wb") as q_file:
    pickle.dump(mc.q, q_file)
In [3]:
# Reload the pickled reference values from "q_star_100.obj".
# NOTE(review): pickle.load can execute arbitrary code while unpickling; only
# load a q_star_100.obj that was produced by a trusted run of this notebook.
with open("q_star_100.obj", "rb") as q_file:
    q_star = pickle.load(q_file)

# Sarsa is constructed with the loaded values.
# NOTE(review): presumably they serve as the reference that solve() measures
# its error against — confirm in TDControl.Sarsa.
sarsa = Sarsa(q_star)

# Sweep lambda over 0.0, 0.1, ..., 1.0 and collect one solve() result per value.
# np.linspace pins the grid to exactly 11 points; np.arange with a float step
# derives its length from a rounded division and can gain or lose the end point.
lambda_mse = []
for n_lambda in np.linspace(0, 1, 11):
    lambda_mse.append(sarsa.solve(n_lambda))
In [4]:
# Plot the collected lambda_mse values against the lambda grid 0.0, 0.1, ..., 1.0.
# np.linspace fixes the grid at exactly 11 points, avoiding the rounding-dependent
# length of np.arange with a float step; the x values must pair one-to-one with
# the entries of lambda_mse.
Plot2D(np.linspace(0, 1, 11), lambda_mse)
In [5]:
# Run Sarsa with 0 as the first positional argument (the slot the lambda sweep
# fills with n_lambda) and need_list=True; the result is bound to `mse`.
# NOTE(review): presumably need_list=True makes solve() return a sequence of
# error values instead of a single number — confirm in TDControl.Sarsa.solve.
mse = sarsa.solve(0, need_list=True)
In [6]:
# Plot the current `mse` against x = 0..999.
# NOTE(review): the 1000 is hard-coded; this assumes `mse` holds exactly 1000
# entries — confirm against the episode count used inside Sarsa.solve.
Plot2D(range(1000), mse)
In [7]:
# Run Sarsa again, this time with 1 as the first positional argument (the slot
# the lambda sweep fills with n_lambda); this rebinds `mse`, discarding the
# value from the previous solve() cell.
# NOTE(review): presumably need_list=True makes solve() return a sequence of
# error values instead of a single number — confirm in TDControl.Sarsa.solve.
mse = sarsa.solve(1, need_list=True)
In [8]:
# Plot the current `mse` against x = 0..999; when cells run top to bottom this
# is the result of sarsa.solve(1, need_list=True).
# NOTE(review): the 1000 is hard-coded; this assumes `mse` holds exactly 1000
# entries — confirm against the episode count used inside Sarsa.solve.
Plot2D(range(1000), mse)
In [ ]: