In [1]:
from ddpg3 import *
%matplotlib inline


[2016-07-20 09:18:08,203] Site environment registry incorrect: Scoreboard did not register all envs: set(['AcrobotContinuous-v0'])

In [2]:
# Build the DDPG agent for the continuous mountain-car environment.
# noise_scale is passed straight through to ddpg(); its exact meaning is
# defined in ddpg3.py (presumably the exploration-noise magnitude -- TODO confirm).
car = ddpg(
    environment='MountainCarContinuous-v0',
    noise_scale=1.0,
)

# main() calls initialize_training() and then start_training() (see ddpg3.py);
# the run below was stopped manually with a kernel interrupt.
car.main()


[2016-07-20 09:18:08,247] Making new env: MountainCarContinuous-v0
state dim 2
action dim 1
[2016-07-20 09:18:11,507] Action '0.992385999557' is not contained within action space 'Box(1,)'.
result after minibatch no. 0 : mean squared error: 471.799285889
plotting the mu() policy learned by NN
plotting the Qfunction
action 0.0
action 0.5
action 1.0
action 1.5
action 2.0
result after minibatch no. 1000 : mean squared error: 185.021911621
plotting the mu() policy learned by NN
plotting the Qfunction
action 0.0
action 0.5
action 1.0
action 1.5
action 2.0
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-2-e3ec9066d5ec> in <module>()
      1 car = ddpg(environment = 'MountainCarContinuous-v0', noise_scale= 1.0)
----> 2 car.main()

/home/frederik/Dokumente/DeepRL/dpg/ddpg3.py in main(self)
    459 
    460         self.initialize_training(self.sess)
--> 461         self.start_training()
    462 
    463 

/home/frederik/Dokumente/DeepRL/dpg/ddpg3.py in start_training(self, maxstep, dataname, save)
    187 
    188             if (it+1) % plot_freq == 0:
--> 189                 self.plot_episode_lengths(self.train_lengths)
    190                 self.plot_episode_lengths(self.test_lengths)
    191 

/home/frederik/Dokumente/DeepRL/dpg/ddpg3.py in plot_episode_lengths(self, lengths)
    451             plt.ylabel("timesteps")
    452 
--> 453             plt.show()
    454 
    455     def main(self):

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/pyplot.pyc in show(*args, **kw)
    242     """
    243     global _show
--> 244     return _show(*args, **kw)
    245 
    246 

/home/frederik/anaconda2/lib/python2.7/site-packages/ipykernel/pylab/backend_inline.pyc in show(close, block)
     34     try:
     35         for figure_manager in Gcf.get_all_fig_managers():
---> 36             display(figure_manager.canvas.figure)
     37     finally:
     38         show._to_draw = []

/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/display.pyc in display(*objs, **kwargs)
    156             publish_display_data(data=obj, metadata=metadata)
    157         else:
--> 158             format_dict, md_dict = format(obj, include=include, exclude=exclude)
    159             if not format_dict:
    160                 # nothing to display (e.g. _ipython_display_ took over)

/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/formatters.pyc in format(self, obj, include, exclude)
    175             md = None
    176             try:
--> 177                 data = formatter(obj)
    178             except:
    179                 # FIXME: log the exception

<decorator-gen-9> in __call__(self, obj)

/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/formatters.pyc in catch_format_error(method, self, *args, **kwargs)
    220     """show traceback on failed format call"""
    221     try:
--> 222         r = method(self, *args, **kwargs)
    223     except NotImplementedError:
    224         # don't warn on NotImplementedErrors

/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/formatters.pyc in __call__(self, obj)
    337                 pass
    338             else:
--> 339                 return printer(obj)
    340             # Finally look for special method names
    341             method = _safe_get_formatter_method(obj, self.print_method)

/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/pylabtools.pyc in <lambda>(fig)
    226 
    227     if 'png' in formats:
--> 228         png_formatter.for_type(Figure, lambda fig: print_figure(fig, 'png', **kwargs))
    229     if 'retina' in formats or 'png2x' in formats:
    230         png_formatter.for_type(Figure, lambda fig: retina_figure(fig, **kwargs))

/home/frederik/anaconda2/lib/python2.7/site-packages/IPython/core/pylabtools.pyc in print_figure(fig, fmt, bbox_inches, **kwargs)
    117 
    118     bytes_io = BytesIO()
--> 119     fig.canvas.print_figure(bytes_io, **kw)
    120     data = bytes_io.getvalue()
    121     if fmt == 'svg':

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/backend_bases.pyc in print_figure(self, filename, dpi, facecolor, edgecolor, orientation, format, **kwargs)
   2178                     orientation=orientation,
   2179                     dryrun=True,
-> 2180                     **kwargs)
   2181                 renderer = self.figure._cachedRenderer
   2182                 bbox_inches = self.figure.get_tightbbox(renderer)

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/backends/backend_agg.pyc in print_png(self, filename_or_obj, *args, **kwargs)
    525 
    526     def print_png(self, filename_or_obj, *args, **kwargs):
--> 527         FigureCanvasAgg.draw(self)
    528         renderer = self.get_renderer()
    529         original_dpi = renderer.dpi

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/backends/backend_agg.pyc in draw(self)
    472 
    473         try:
--> 474             self.figure.draw(self.renderer)
    475         finally:
    476             RendererAgg.lock.release()

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/artist.pyc in draw_wrapper(artist, renderer, *args, **kwargs)
     59     def draw_wrapper(artist, renderer, *args, **kwargs):
     60         before(artist, renderer)
---> 61         draw(artist, renderer, *args, **kwargs)
     62         after(artist, renderer)
     63 

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/figure.pyc in draw(self, renderer)
   1157         dsu.sort(key=itemgetter(0))
   1158         for zorder, a, func, args in dsu:
-> 1159             func(*args)
   1160 
   1161         renderer.close_group('figure')

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/artist.pyc in draw_wrapper(artist, renderer, *args, **kwargs)
     59     def draw_wrapper(artist, renderer, *args, **kwargs):
     60         before(artist, renderer)
---> 61         draw(artist, renderer, *args, **kwargs)
     62         after(artist, renderer)
     63 

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axes/_base.pyc in draw(self, renderer, inframe)
   2322 
   2323         for zorder, a in dsu:
-> 2324             a.draw(renderer)
   2325 
   2326         renderer.close_group('axes')

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/artist.pyc in draw_wrapper(artist, renderer, *args, **kwargs)
     59     def draw_wrapper(artist, renderer, *args, **kwargs):
     60         before(artist, renderer)
---> 61         draw(artist, renderer, *args, **kwargs)
     62         after(artist, renderer)
     63 

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in draw(self, renderer, *args, **kwargs)
   1104         renderer.open_group(__name__)
   1105 
-> 1106         ticks_to_draw = self._update_ticks(renderer)
   1107         ticklabelBoxes, ticklabelBoxes2 = self._get_tick_bboxes(ticks_to_draw,
   1108                                                                 renderer)

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in _update_ticks(self, renderer)
    947 
    948         interval = self.get_view_interval()
--> 949         tick_tups = [t for t in self.iter_ticks()]
    950         if self._smart_bounds:
    951             # handle inverted limits

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in iter_ticks(self)
    897 
    898         minorLocs = self.minor.locator()
--> 899         minorTicks = self.get_minor_ticks(len(minorLocs))
    900         self.minor.formatter.set_locs(minorLocs)
    901         minorLabels = [self.minor.formatter(val, i)

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in get_minor_ticks(self, numticks)
   1316             # update the new tick label properties from the old
   1317             for i in range(numticks - len(self.minorTicks)):
-> 1318                 tick = self._get_tick(major=False)
   1319                 self.minorTicks.append(tick)
   1320 

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in _get_tick(self, major)
   1998         else:
   1999             tick_kw = self._minor_tick_kw
-> 2000         return YTick(self.axes, 0, '', major=major, **tick_kw)
   2001 
   2002     def _get_label(self):

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in __init__(self, axes, loc, label, size, width, color, tickdir, pad, labelsize, labelcolor, zorder, gridOn, tick1On, tick2On, label1On, label2On, major)
    149 
    150         self.tick1line = self._get_tick1line()
--> 151         self.tick2line = self._get_tick2line()
    152         self.gridline = self._get_gridline()
    153 

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/axis.pyc in _get_tick2line(self)
    550                           markersize=self._size,
    551                           markeredgewidth=self._width,
--> 552                           zorder=self._zorder)
    553         l.set_transform(self.axes.get_yaxis_transform(which='tick2'))
    554         self._set_artist_props(l)

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/lines.pyc in __init__(self, xdata, ydata, linewidth, linestyle, color, marker, markersize, markeredgewidth, markeredgecolor, markerfacecolor, markerfacecoloralt, fillstyle, antialiased, dash_capstyle, solid_capstyle, dash_joinstyle, solid_joinstyle, pickradius, drawstyle, markevery, **kwargs)
    337         self.set_color(color)
    338         self._marker = MarkerStyle()
--> 339         self.set_marker(marker)
    340 
    341         self._markevery = None

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/lines.pyc in set_marker(self, marker)
   1069 
   1070         """
-> 1071         self._marker.set_marker(marker)
   1072         self.stale = True
   1073 

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/markers.pyc in set_marker(self, marker)
    253 
    254         self._marker = marker
--> 255         self._recache()
    256 
    257     def get_path(self):

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/markers.pyc in _recache(self)
    184     def _recache(self):
    185         self._path = Path(np.empty((0, 2)))
--> 186         self._transform = IdentityTransform()
    187         self._alt_path = None
    188         self._alt_transform = None

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/transforms.pyc in __init__(self, *args, **kwargs)
   1639 
   1640     def __init__(self, *args, **kwargs):
-> 1641         Transform.__init__(self, *args, **kwargs)
   1642         self._inverted = None
   1643 

/home/frederik/anaconda2/lib/python2.7/site-packages/matplotlib/transforms.pyc in __init__(self, shorthand_name)
     96         # parents are deleted, references from the children won't keep
     97         # them alive.
---> 98         self._parents = WeakValueDictionary()
     99 
    100         # TransformNodes start out as invalid until their values are

/home/frederik/anaconda2/lib/python2.7/weakref.pyc in __init__(*args, **kw)
     64         self._pending_removals = []
     65         self._iterating = set()
---> 66         UserDict.UserDict.__init__(self, *args, **kw)
     67 
     68     def _commit_removals(self):

/home/frederik/anaconda2/lib/python2.7/UserDict.pyc in __init__(*args, **kwargs)
      2 
      3 class UserDict:
----> 4     def __init__(*args, **kwargs):
      5         if not args:
      6             raise TypeError("descriptor '__init__' of 'UserDict' object "

KeyboardInterrupt: 

In [ ]:


In [ ]: