In [1]:
from transition_table import TransitionTable
from action import Action
import numpy as np
# Shape of the dummy frames fed to the table below; named once so the two
# test images cannot drift apart.
FRAME_SHAPE = (84, 84)

# Fresh transition table that the following cells inspect.
table = TransitionTable()

# Two constant-valued frames (all 1s and all 2s) so that each stored frame can
# be told apart by its values/norm when read back.
img = np.ones(FRAME_SHAPE)
img2 = 2 * np.ones(FRAME_SHAPE)

# NOTE(review): add_transition's parameter meanings are not visible in this
# notebook; presumably (frame, terminal, action, reward, was_start) -- confirm
# against transition_table.py.
table.add_transition(img, False, Action(2), 0.5, True)
table.add_transition(img2, False, Action(3), 0.7, False)
In [ ]:
# Fetch the table's most recent frames and print the norm of each of the first
# four slices along the last axis.
# Assumes get_recent() returns a 3-D array with at least 4 entries on its last
# axis -- TODO confirm against TransitionTable.
recent = table.get_recent()
for i in range(4):
    # Single-argument print(...) behaves the same on Python 2 and Python 3.
    print(np.linalg.norm(recent[:, :, i]))
In [14]:
# Pull a minibatch from the table and show the values at one fixed location
# ([0, 20, 20, :]) of the last and first returned arrays.
# NOTE(review): get_minibatch() yields five values; the names suggest
# (state, terminal, action, reward, next state) -- confirm against
# TransitionTable before relying on that reading.
s, t, a, r, sp = table.get_minibatch()
# Single-argument print(...) behaves the same on Python 2 and Python 3.
print(sp[0, 20, 20, :])
print(s[0, 20, 20, :])
In [ ]:
In [ ]:
# Dump whatever get_recent() currently returns.
# Single-argument print(...) behaves the same on Python 2 and Python 3.
print(table.get_recent())
In [ ]:
# Display the was_start attribute of the first entry in table.transitions
# (shown as the cell's output because it is the last expression).
table.transitions[0].was_start
In [ ]: