diff --git a/baselines/ddpg/ddpg.py b/baselines/ddpg/ddpg.py index 37551d4931..4bbda692b9 100755 --- a/baselines/ddpg/ddpg.py +++ b/baselines/ddpg/ddpg.py @@ -58,7 +58,7 @@ def learn(network, env, rank = 0 nb_actions = env.action_space.shape[-1] - assert (np.abs(env.action_space.low) == env.action_space.high).all() # we assume symmetric actions. + #assert (np.abs(env.action_space.low) == env.action_space.high).all() # we assume symmetric actions. memory = Memory(limit=int(1e6), action_shape=env.action_space.shape, observation_shape=env.observation_space.shape) critic = Critic(network=network, **network_kwargs) diff --git a/baselines/run.py b/baselines/run.py index 609de6ec5c..caf00e0a1c 100644 --- a/baselines/run.py +++ b/baselines/run.py @@ -50,7 +50,7 @@ 'SpaceInvaders-Snes', } - +_game_envs['madras'] = {'gym-torcs-v0','gym-madras-v0'} def train(args, extra_args): env_type, env_id = get_env_type(args.env) print('env_type: {}'.format(env_type))