diff --git a/examples/pybullet/gym/pybullet_envs/__init__.py b/examples/pybullet/gym/pybullet_envs/__init__.py index 369fc0f87..f681b2d99 100644 --- a/examples/pybullet/gym/pybullet_envs/__init__.py +++ b/examples/pybullet/gym/pybullet_envs/__init__.py @@ -18,7 +18,7 @@ register( register( id='RacecarBulletEnv-v0', - entry_point='pybullet_envs.bullet:RacecarBulletEnv', + entry_point='pybullet_envs.bullet:RacecarGymEnv', timestep_limit=1000, reward_threshold=5.0, ) diff --git a/examples/pybullet/gym/pybullet_envs/bullet/racecarGymEnv.py b/examples/pybullet/gym/pybullet_envs/bullet/racecarGymEnv.py index 458d265bd..1d4074262 100644 --- a/examples/pybullet/gym/pybullet_envs/bullet/racecarGymEnv.py +++ b/examples/pybullet/gym/pybullet_envs/bullet/racecarGymEnv.py @@ -43,7 +43,8 @@ class RacecarGymEnv(gym.Env): observationDim = 2 #len(self.getExtendedObservation()) #print("observationDim") #print(observationDim) - observation_high = np.array([np.finfo(np.float32).max] * observationDim) + # observation_high = np.array([np.finfo(np.float32).max] * observationDim) + observation_high = np.ones(observationDim) * 1000 #np.inf if (isDiscrete): self.action_space = spaces.Discrete(9) else: @@ -130,7 +131,19 @@ class RacecarGymEnv(gym.Env): return np.array(self._observation), reward, done, {} def _render(self, mode='human', close=False): - return + width=320 + height=200 + img_arr = self._p.getCameraImage(width,height) + w=img_arr[0] + h=img_arr[1] + rgb=img_arr[2] + dep=img_arr[3] + #print 'width = %d height = %d' % (w,h) + # reshape creates np array + np_img_arr = np.reshape(rgb, (h, w, 4)) + # remove alpha channel + np_img_arr = np_img_arr[:, :, :3] + return np_img_arr def _termination(self): return self._envStepCounter>1000 diff --git a/examples/pybullet/gym/pybullet_envs/examples/enjoy_pybullet_racecar.py b/examples/pybullet/gym/pybullet_envs/examples/enjoy_pybullet_racecar.py index 717d82343..ce3e74358 100644 --- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_pybullet_racecar.py +++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_pybullet_racecar.py @@ -12,7 +12,7 @@ from baselines import deepq def main(): - env = RacecarGymEnv(renders=False,isDiscrete=True) + env = RacecarGymEnv(renders=True,isDiscrete=True) act = deepq.load("racecar_model.pkl") print(act) while True: diff --git a/examples/pybullet/gym/pybullet_envs/examples/racecarGymEnvTest.py b/examples/pybullet/gym/pybullet_envs/examples/racecarGymEnvTest.py index a2ef5a855..fb439042d 100644 --- a/examples/pybullet/gym/pybullet_envs/examples/racecarGymEnvTest.py +++ b/examples/pybullet/gym/pybullet_envs/examples/racecarGymEnvTest.py @@ -5,7 +5,7 @@ parentdir = os.path.dirname(os.path.dirname(currentdir)) os.sys.path.insert(0,parentdir) from pybullet_envs.bullet.racecarGymEnv import RacecarGymEnv -isDiscrete = True +isDiscrete = False environment = RacecarGymEnv(renders=True, isDiscrete=isDiscrete) environment.reset()