In [1]:
from run import *
%matplotlib inline


[2016-07-17 15:47:19,894] Site environment registry incorrect: Scoreboard did not register all envs: set(['AcrobotContinuous-v0'])

In [2]:
# Build the experiment driver and start it. `Experiment` is not defined in this
# notebook; it presumably comes in through the `from run import *` in the first
# cell (the traceback below resolves `e.run()` to run.py) -- TODO confirm.
e = Experiment()
# Per the recorded traceback, run() calls run_episode(test=False) and appends
# the result to `episodelengths`; run_episode() feeds each step to
# agent.observe(), which calls train() once self.t exceeds FLAGS.warmup.
# The saved output for this cell ends in a KeyboardInterrupt, not a normal return.
e.run()


[2016-07-17 15:47:20,092] Making new env: InvertedPendulum-v1
('action center a_c', array([ 0.]))
('action scale a_c', array([ 3.]))
True action space: [-3.], [ 3.]
True state space: [-inf -inf -inf -inf], [ inf  inf  inf  inf]
Filtered action space: [-1.], [ 1.]
Filtered state space: [-inf -inf -inf -inf], [ inf  inf  inf  inf]
observationspace action space ((4,), (1,))
{'_entry_point': 'gym.envs.mujoco:InvertedPendulumEnv',
 '_env_name': 'InvertedPendulum',
 '_kwargs': {},
 '_local_only': False,
 'id': 'InvertedPendulum-v1',
 'nondeterministic': False,
 'reward_threshold': 950.0,
 'timestep_limit': 1000,
 'trials': 100}
[2016-07-17 15:47:23,020] Action '[-1.16931295]' is not contained within action space 'Box(1,)'.
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-2-086fdd659d45> in <module>()
      1 e = Experiment()
----> 2 e.run()

/home/frederik/Dokumente/DeepRL/ddpg_working/run.py in run(self)
     68                 it +=1
     69 
---> 70                 episodelengths.append(self.run_episode(test=False))
     71                 # print(episodelengths[-1])
     72 

/home/frederik/Dokumente/DeepRL/ddpg_working/run.py in run_episode(self, test, monitor)
    137 
    138             r_f = self.env.filter_reward(reward)
--> 139             self.agent.observe(r_f, term, observation, test=test and not FLAGS.tot)
    140 
    141             if test:

/home/frederik/Dokumente/DeepRL/ddpg_working/ddpg.py in observe(self, rew, term, obs2, test)
    170             if self.t > FLAGS.warmup:
    171                 # print('warmed up')
--> 172                 self.train()
    173 
    174             # elif FLAGS.warmq and self.rm.n > 1000:

/home/frederik/Dokumente/DeepRL/ddpg_working/ddpg.py in train(self)
    188 
    189         if FLAGS.async:
--> 190             self._train(obs, act, rew, ob2, term2, log=log, global_step=self.t)
    191         else:
    192             self._train_q(obs, act, rew, ob2, term2, log=log, global_step=self.t)

/home/frederik/Dokumente/DeepRL/ddpg_working/ddpg.py in __call__(self, *args, **kwargs)
    241 
    242         out = self._outputs + [self._summary_op] if log else self._outputs
--> 243         res = self._session.run(out, feeds)
    244 
    245         if log:

/home/frederik/anaconda2/lib/python2.7/site-packages/tensorflow/python/client/session.pyc in run(self, fetches, feed_dict, options, run_metadata)
    370     try:
    371       result = self._run(None, fetches, feed_dict, options_ptr,
--> 372                          run_metadata_ptr)
    373       if run_metadata:
    374         proto_data = tf_session.TF_GetBuffer(run_metadata_ptr)

/home/frederik/anaconda2/lib/python2.7/site-packages/tensorflow/python/client/session.pyc in _run(self, handle, fetches, feed_dict, options, run_metadata)
    634     try:
    635       results = self._do_run(handle, target_list, unique_fetches,
--> 636                              feed_dict_string, options, run_metadata)
    637     finally:
    638       # The movers are no longer used. Delete them.

/home/frederik/anaconda2/lib/python2.7/site-packages/tensorflow/python/client/session.pyc in _do_run(self, handle, target_list, fetch_list, feed_dict, options, run_metadata)
    706     if handle is None:
    707       return self._do_call(_run_fn, self._session, feed_dict, fetch_list,
--> 708                            target_list, options, run_metadata)
    709     else:
    710       return self._do_call(_prun_fn, self._session, handle, feed_dict,

/home/frederik/anaconda2/lib/python2.7/site-packages/tensorflow/python/client/session.pyc in _do_call(self, fn, *args)
    713   def _do_call(self, fn, *args):
    714     try:
--> 715       return fn(*args)
    716     except errors.OpError as e:
    717       message = compat.as_text(e.message)

/home/frederik/anaconda2/lib/python2.7/site-packages/tensorflow/python/client/session.pyc in _run_fn(session, feed_dict, fetch_list, target_list, options, run_metadata)
    695         return tf_session.TF_Run(session, options,
    696                                  feed_dict, fetch_list, target_list,
--> 697                                  status, run_metadata)
    698 
    699     def _prun_fn(session, handle, feed_dict, fetch_list):

KeyboardInterrupt: 

In [ ]: