In [1]:
from ddpg3 import *
%matplotlib inline
[2016-07-20 09:18:08,203] Site environment registry incorrect: Scoreboard did not register all envs: set(['AcrobotContinuous-v0'])
In [2]:
# Instantiate the `ddpg` learner (star-imported from ddpg3) on the
# continuous-action Mountain Car environment.
# NOTE(review): noise_scale presumably scales the exploration noise that is
# added to the policy's actions -- confirm against ddpg3.ddpg.
car = ddpg(
    environment='MountainCarContinuous-v0',
    noise_scale=1.0,
)

# main() runs initialize_training(...) and then start_training() with its
# default arguments; start_training() periodically plots the train/test
# episode lengths while it runs.
car.main()
[2016-07-20 09:18:08,247] Making new env: MountainCarContinuous-v0
state dim 2
action dim 1
[2016-07-20 09:18:11,507] Action '0.992385999557' is not contained within action space 'Box(1,)'.
result after minibatch no. 0 : mean squared error: 471.799285889
plotting the mu() policy learned by NN
plotting the Qfunction
action 0.0
action 0.5
action 1.0
action 1.5
action 2.0
result after minibatch no. 1000 : mean squared error: 185.021911621
plotting the mu() policy learned by NN
plotting the Qfunction
action 0.0
action 0.5
action 1.0
action 1.5
action 2.0
---------------------------------------------------------------------------
KeyboardInterrupt Traceback (most recent call last)
<ipython-input-2-e3ec9066d5ec> in <module>()
1 car = ddpg(environment = 'MountainCarContinuous-v0', noise_scale= 1.0)
----> 2 car.main()
/home/frederik/Dokumente/DeepRL/dpg/ddpg3.py in main(self)
459
460 self.initialize_training(self.sess)
--> 461 self.start_training()
462
463
/home/frederik/Dokumente/DeepRL/dpg/ddpg3.py in start_training(self, maxstep, dataname, save)
187
188 if (it+1) % plot_freq == 0:
--> 189 self.plot_episode_lengths(self.train_lengths)
190 self.plot_episode_lengths(self.test_lengths)
191
/home/frederik/Dokumente/DeepRL/dpg/ddpg3.py in plot_episode_lengths(self, lengths)
451 plt.ylabel("timesteps")
452
--> 453 plt.show()
454
455 def main(self):
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/pyplot.pyc in show(*args, **kw)
242 """
243 global _show
--> 244 return _show(*args, **kw)
245
246
/home/frederik/anaconda2/lib/python2.7/site-packages/ipykernel/pylab/backend_inline.pyc in show(close, block)
34 try:
35 for figure_manager in Gcf.get_all_fig_managers():
---> 36 display(figure_manager.canvas.figure)
37 finally:
38 show._to_draw = []
/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/display.pyc in display(*objs, **kwargs)
156 publish_display_data(data=obj, metadata=metadata)
157 else:
--> 158 format_dict, md_dict = format(obj, include=include, exclude=exclude)
159 if not format_dict:
160 # nothing to display (e.g. _ipython_display_ took over)
/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/formatters.pyc in format(self, obj, include, exclude)
175 md = None
176 try:
--> 177 data = formatter(obj)
178 except:
179 # FIXME: log the exception
<decorator-gen-9> in __call__(self, obj)
/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/formatters.pyc in catch_format_error(method, self, *args, **kwargs)
220 """show traceback on failed format call"""
221 try:
--> 222 r = method(self, *args, **kwargs)
223 except NotImplementedError:
224 # don't warn on NotImplementedErrors
/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/formatters.pyc in __call__(self, obj)
337 pass
338 else:
--> 339 return printer(obj)
340 # Finally look for special method names
341 method = _safe_get_formatter_method(obj, self.print_method)
/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/pylabtools.pyc in <lambda>(fig)
226
227 if 'png' in formats:
--> 228 png_formatter.for_type(Figure, lambda fig: print_figure(fig, 'png', **kwargs))
229 if 'retina' in formats or 'png2x' in formats:
230 png_formatter.for_type(Figure, lambda fig: retina_figure(fig, **kwargs))
/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/pylabtools.pyc in print_figure(fig, fmt, bbox_inches, **kwargs)
117
118 bytes_io = BytesIO()
--> 119 fig.canvas.print_figure(bytes_io, **kw)
120 data = bytes_io.getvalue()
121 if fmt == 'svg':
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/backend_bases.pyc in print_figure(self, filename, dpi, facecolor, edgecolor, orientation, format, **kwargs)
2178 orientation=orientation,
2179 dryrun=True,
-> 2180 **kwargs)
2181 renderer = self.figure._cachedRenderer
2182 bbox_inches = self.figure.get_tightbbox(renderer)
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/backends/backend_agg.pyc in print_png(self, filename_or_obj, *args, **kwargs)
525
526 def print_png(self, filename_or_obj, *args, **kwargs):
--> 527 FigureCanvasAgg.draw(self)
528 renderer = self.get_renderer()
529 original_dpi = renderer.dpi
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/backends/backend_agg.pyc in draw(self)
472
473 try:
--> 474 self.figure.draw(self.renderer)
475 finally:
476 RendererAgg.lock.release()
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/artist.pyc in draw_wrapper(artist, renderer, *args, **kwargs)
59 def draw_wrapper(artist, renderer, *args, **kwargs):
60 before(artist, renderer)
---> 61 draw(artist, renderer, *args, **kwargs)
62 after(artist, renderer)
63
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/figure.pyc in draw(self, renderer)
1157 dsu.sort(key=itemgetter(0))
1158 for zorder, a, func, args in dsu:
-> 1159 func(*args)
1160
1161 renderer.close_group('figure')
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/artist.pyc in draw_wrapper(artist, renderer, *args, **kwargs)
59 def draw_wrapper(artist, renderer, *args, **kwargs):
60 before(artist, renderer)
---> 61 draw(artist, renderer, *args, **kwargs)
62 after(artist, renderer)
63
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axes/_base.pyc in draw(self, renderer, inframe)
2322
2323 for zorder, a in dsu:
-> 2324 a.draw(renderer)
2325
2326 renderer.close_group('axes')
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/artist.pyc in draw_wrapper(artist, renderer, *args, **kwargs)
59 def draw_wrapper(artist, renderer, *args, **kwargs):
60 before(artist, renderer)
---> 61 draw(artist, renderer, *args, **kwargs)
62 after(artist, renderer)
63
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in draw(self, renderer, *args, **kwargs)
1104 renderer.open_group(__name__)
1105
-> 1106 ticks_to_draw = self._update_ticks(renderer)
1107 ticklabelBoxes, ticklabelBoxes2 = self._get_tick_bboxes(ticks_to_draw,
1108 renderer)
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in _update_ticks(self, renderer)
947
948 interval = self.get_view_interval()
--> 949 tick_tups = [t for t in self.iter_ticks()]
950 if self._smart_bounds:
951 # handle inverted limits
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in iter_ticks(self)
897
898 minorLocs = self.minor.locator()
--> 899 minorTicks = self.get_minor_ticks(len(minorLocs))
900 self.minor.formatter.set_locs(minorLocs)
901 minorLabels = [self.minor.formatter(val, i)
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in get_minor_ticks(self, numticks)
1316 # update the new tick label properties from the old
1317 for i in range(numticks - len(self.minorTicks)):
-> 1318 tick = self._get_tick(major=False)
1319 self.minorTicks.append(tick)
1320
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in _get_tick(self, major)
1998 else:
1999 tick_kw = self._minor_tick_kw
-> 2000 return YTick(self.axes, 0, '', major=major, **tick_kw)
2001
2002 def _get_label(self):
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in __init__(self, axes, loc, label, size, width, color, tickdir, pad, labelsize, labelcolor, zorder, gridOn, tick1On, tick2On, label1On, label2On, major)
149
150 self.tick1line = self._get_tick1line()
--> 151 self.tick2line = self._get_tick2line()
152 self.gridline = self._get_gridline()
153
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in _get_tick2line(self)
550 markersize=self._size,
551 markeredgewidth=self._width,
--> 552 zorder=self._zorder)
553 l.set_transform(self.axes.get_yaxis_transform(which='tick2'))
554 self._set_artist_props(l)
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/lines.pyc in __init__(self, xdata, ydata, linewidth, linestyle, color, marker, markersize, markeredgewidth, markeredgecolor, markerfacecolor, markerfacecoloralt, fillstyle, antialiased, dash_capstyle, solid_capstyle, dash_joinstyle, solid_joinstyle, pickradius, drawstyle, markevery, **kwargs)
337 self.set_color(color)
338 self._marker = MarkerStyle()
--> 339 self.set_marker(marker)
340
341 self._markevery = None
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/lines.pyc in set_marker(self, marker)
1069
1070 """
-> 1071 self._marker.set_marker(marker)
1072 self.stale = True
1073
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/markers.pyc in set_marker(self, marker)
253
254 self._marker = marker
--> 255 self._recache()
256
257 def get_path(self):
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/markers.pyc in _recache(self)
184 def _recache(self):
185 self._path = Path(np.empty((0, 2)))
--> 186 self._transform = IdentityTransform()
187 self._alt_path = None
188 self._alt_transform = None
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/transforms.pyc in __init__(self, *args, **kwargs)
1639
1640 def __init__(self, *args, **kwargs):
-> 1641 Transform.__init__(self, *args, **kwargs)
1642 self._inverted = None
1643
/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/transforms.pyc in __init__(self, shorthand_name)
96 # parents are deleted, references from the children won't keep
97 # them alive.
---> 98 self._parents = WeakValueDictionary()
99
100 # TransformNodes start out as invalid until their values are
/home/frederik/anaconda2/lib/python2.7/weakref.pyc in __init__(*args, **kw)
64 self._pending_removals = []
65 self._iterating = set()
---> 66 UserDict.UserDict.__init__(self, *args, **kw)
67
68 def _commit_removals(self):
/home/frederik/anaconda2/lib/python2.7/UserDict.pyc in __init__(*args, **kwargs)
2
3 class UserDict:
----> 4 def __init__(*args, **kwargs):
5 if not args:
6 raise TypeError("descriptor '__init__' of 'UserDict' object "
KeyboardInterrupt:
In [ ]:
In [ ]:
Content source: febert/DeepRL
Similar notebooks: