(206.0, 'of', 500, ', lr:', 0.29171528588098017)
(183.0, 'of', 500, ', lr:', 0.20650916900710392)
(207.0, 'of', 500, ', lr:', 0.15776603297310088)
(221.0, 'of', 500, ', lr:', 0.12708418056120374)
(242.0, 'of', 500, ', lr:', 0.1060096892856007)
(251.0, 'of', 500, ', lr:', 0.09105892422986915)
(224.0, 'of', 500, ', lr:', 0.07998400319936012)
(269.0, 'of', 500, ', lr:', 0.07036802476954472)
(265.0, 'of', 500, ', lr:', 0.06298339757639886)
---------------------------------------------------------------------------
KeyboardInterrupt Traceback (most recent call last)
<ipython-input-14-e916f46b95f9> in <module>()
----> 1 model.fit(env)
/home/cristian/data/cristian/tfinterface/tfinterface/reinforcement/reinforcement_base.py in fit(self, *args, **kwargs)
468
469 def fit(self, *args, **kwargs):
--> 470 self.trainer.fit(*args, **kwargs)
471
472 @abstractmethod
/home/cristian/data/cristian/tfinterface/tfinterface/reinforcement/reinforcement_base.py in fit(self, env, episodes, max_episodes)
531 experience = self.get_experience(s, a, r, s1, done, info)
532 self.experience_buffer.append(experience)
--> 533 self.train_on_experience(*experience)
534 self.after_experience(*experience)
535
<ipython-input-13-d3f257c92ec1> in train_on_experience(self, *experience)
73 def train_on_experience(self, *experience):
74 feed_dict = self.model.experience_feed(*experience)
---> 75 self.model.sess.run(self.model.update, feed_dict=feed_dict)
76
77 def after_episode(self, *args):
/usr/local/lib/python2.7/dist-packages/tensorflow/python/client/session.pyc in run(self, fetches, feed_dict, options, run_metadata)
765 try:
766 result = self._run(None, fetches, feed_dict, options_ptr,
--> 767 run_metadata_ptr)
768 if run_metadata:
769 proto_data = tf_session.TF_GetBuffer(run_metadata_ptr)
/usr/local/lib/python2.7/dist-packages/tensorflow/python/client/session.pyc in _run(self, handle, fetches, feed_dict, options, run_metadata)
936 ' to a larger type (e.g. int64).')
937
--> 938 np_val = np.asarray(subfeed_val, dtype=subfeed_dtype)
939
940 if not subfeed_t.get_shape().is_compatible_with(np_val.shape):
/usr/local/lib/python2.7/dist-packages/numpy/core/numeric.pyc in asarray(a, dtype, order)
529
530 """
--> 531 return array(a, dtype, copy=False, order=order)
532
533
KeyboardInterrupt: