Move the pybullet.connect call into the Gym environment.

To enable rendering, call env.render(mode="human") before the first call to env.reset().
2017-08-26 14:58:48 -07:00
parent 51b7e1040f
commit e267f5c3d2
10 changed files with 44 additions and 53 deletions
--- a/examples/pybullet/gym/pybullet_envs/env_bases.py
+++ b/examples/pybullet/gym/pybullet_envs/env_bases.py
@@ -15,11 +15,11 @@ class MJCFBaseBulletEnv(gym.Env):
 		'video.frames_per_second': 60
 		}

-	def __init__(self, robot):
+	def __init__(self, robot, render=False):
 		self.scene = None
-
+		self.physicsClientId=-1
 		self.camera = Camera()
-
+		self.isRender = render
 		self.robot = robot

 		self._seed()
@@ -33,6 +33,15 @@ class MJCFBaseBulletEnv(gym.Env):
 		return [seed]

 	def _reset(self):
+		print("self.isRender=")
+		print(self.isRender)
+		if (self.physicsClientId<0):
+			if (self.isRender):
+				self.physicsClientId = p.connect(p.GUI)
+			else:
+				self.physicsClientId = p.connect(p.DIRECT)
+		p.configureDebugVisualizer(p.COV_ENABLE_GUI,0)
+  
 		if self.scene is None:
 			self.scene = self.create_single_player_scene()
 		if not self.scene.multiplayer:
@@ -49,7 +58,13 @@ class MJCFBaseBulletEnv(gym.Env):
 		return s

 	def _render(self, mode, close):
-		pass
+		if (mode=="human"):
+			self.isRender = True
+
+	def _close(self):
+		if (self.physicsClientId>=0):
+			p.disconnect(self.physicsClientId)
+			self.physicsClientId = -1

 	def HUD(self, state, a, done):
 		pass
--- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_AntBulletEnv_v0_2017may.py
+++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_AntBulletEnv_v0_2017may.py
@@ -30,14 +30,10 @@ class SmallReactivePolicy:

 def main():
    env = gym.make("AntBulletEnv-v0")
+    env.render(mode="human")
    
-    cid = p.connect(p.GUI)
-    p.configureDebugVisualizer(p.COV_ENABLE_GUI,0)
    pi = SmallReactivePolicy(env.observation_space, env.action_space)
-
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
    env.reset()
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
    torsoId = -1
    for i in range (p.getNumBodies()):
        print(p.getBodyInfo(i))
@@ -49,9 +45,7 @@ def main():
        frame = 0
        score = 0
        restart_delay = 0
-        p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
        obs = env.reset()
-        p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
     
        while 1:
            time.sleep(0.001)
--- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_HalfCheetahBulletEnv_v0_2017may.py
+++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_HalfCheetahBulletEnv_v0_2017may.py
@@ -29,15 +29,11 @@ class SmallReactivePolicy:

 def main():
    env = gym.make("HalfCheetahBulletEnv-v0")
-
-    cid = p.connect(p.GUI)
+    env.render(mode="human")

    pi = SmallReactivePolicy(env.observation_space, env.action_space)
    #disable rendering during reset, makes loading much faster
-    p.configureDebugVisualizer(p.COV_ENABLE_GUI,0)
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
    env.reset()
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
    torsoId = -1
    for i in range (p.getNumBodies()):
        print(p.getBodyInfo(i))
@@ -52,9 +48,7 @@ def main():
        frame = 0
        score = 0
        restart_delay = 0
-        p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
        obs = env.reset()
-        p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
     
        while 1:
            time.sleep(0.001)
--- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_HopperBulletEnv_v0_2017may.py
+++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_HopperBulletEnv_v0_2017may.py
@@ -32,13 +32,10 @@ class SmallReactivePolicy:

 def main():
    env = gym.make("HopperBulletEnv-v0")
+    env.render(mode="human")
    
-    cid = p.connect(p.GUI)
-    p.configureDebugVisualizer(p.COV_ENABLE_GUI,0)
    pi = SmallReactivePolicy(env.observation_space, env.action_space)
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
    env.reset()
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
    for i in range (p.getNumBodies()):
        print(p.getBodyInfo(i))
        if (p.getBodyInfo(i)[1].decode() == "hopper"):
@@ -52,9 +49,7 @@ def main():
        score = 0
        restart_delay = 0
        #disable rendering during reset, makes loading much faster
-        p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
        obs = env.reset()
-        p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
    
        while 1:
            time.sleep(0.001)
--- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_HumanoidBulletEnv_v0_2017may.py
+++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_HumanoidBulletEnv_v0_2017may.py
@@ -30,13 +30,9 @@ class SmallReactivePolicy:

 def main():
    env = gym.make("HumanoidBulletEnv-v0")
-
-    cid = p.connect(p.GUI)
-    p.configureDebugVisualizer(p.COV_ENABLE_GUI,0)
+    env.render(mode="human")
    pi = SmallReactivePolicy(env.observation_space, env.action_space)
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
    env.reset()
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
    torsoId = -1
    for i in range (p.getNumBodies()):
        print(p.getBodyInfo(i))
@@ -47,9 +43,7 @@ def main():
        frame = 0
        score = 0
        restart_delay = 0
-        p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
        obs = env.reset()
-        p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
       
        while 1:
            time.sleep(0.001)
--- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_InvertedDoublePendulumBulletEnv_v0_2017may.py
+++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_InvertedDoublePendulumBulletEnv_v0_2017may.py
@@ -29,8 +29,7 @@ class SmallReactivePolicy:

 def main():
    env = gym.make("InvertedDoublePendulumBulletEnv-v0")
-
-    cid = p.connect(p.GUI)
+    env.render(mode="human")
   
    pi = SmallReactivePolicy(env.observation_space, env.action_space)

--- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_InvertedPendulumBulletEnv_v0_2017may.py
+++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_InvertedPendulumBulletEnv_v0_2017may.py
@@ -30,8 +30,7 @@ class SmallReactivePolicy:
 def main():
    print("create env")
    env = gym.make("InvertedPendulumBulletEnv-v0")
-    print("connecting")
-    cid = p.connect(p.GUI)
+    env.render(mode="human")
    pi = SmallReactivePolicy(env.observation_space, env.action_space)

    while 1:
--- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_InvertedPendulumSwingupBulletEnv_v0_2017may.py
+++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_InvertedPendulumSwingupBulletEnv_v0_2017may.py
@@ -29,8 +29,7 @@ class SmallReactivePolicy:

 def main():
    env = gym.make("InvertedPendulumSwingupBulletEnv-v0")
-
-    cid = p.connect(p.GUI)
+    env.render(mode="human")
   
    pi = SmallReactivePolicy(env.observation_space, env.action_space)

--- a/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_Walker2DBulletEnv_v0_2017may.py
+++ b/examples/pybullet/gym/pybullet_envs/examples/enjoy_TF_Walker2DBulletEnv_v0_2017may.py
@@ -29,15 +29,10 @@ class SmallReactivePolicy:

 def main():
    env = gym.make("Walker2DBulletEnv-v0")
-
-    cid = p.connect(p.GUI)
-    p.configureDebugVisualizer(p.COV_ENABLE_GUI,0)
+    env.render(mode="human")
    pi = SmallReactivePolicy(env.observation_space, env.action_space)

-    p.configureDebugVisualizer(p.COV_ENABLE_GUI,0)
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
    env.reset()
-    p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
    torsoId = -1
    for i in range (p.getNumBodies()):
        print(p.getBodyInfo(i))
--- a/examples/pybullet/gym/pybullet_envs/gym_locomotion_envs.py
+++ b/examples/pybullet/gym/pybullet_envs/gym_locomotion_envs.py
@@ -1,12 +1,15 @@
 from .scene_stadium import SinglePlayerStadiumScene
 from .env_bases import MJCFBaseBulletEnv
 import numpy as np
+import pybullet as p
 from robot_locomotors import Hopper, Walker2D, HalfCheetah, Ant, Humanoid


 class WalkerBaseBulletEnv(MJCFBaseBulletEnv):
-	def __init__(self, robot):
-		MJCFBaseBulletEnv.__init__(self, robot)
+	def __init__(self, robot, render=False):
+		print("WalkerBase::__init__")
+		MJCFBaseBulletEnv.__init__(self, robot, render)
+		
 		self.camera_x = 0
 		self.walk_target_x = 1e3  # kilometer away
 		self.walk_target_y = 0
@@ -16,11 +19,15 @@ class WalkerBaseBulletEnv(MJCFBaseBulletEnv):
 		return self.stadium_scene

 	def _reset(self):
+		
 		r = MJCFBaseBulletEnv._reset(self)
+		p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,0)
+
 		self.parts, self.jdict, self.ordered_joints, self.robot_body = self.robot.addToScene(
 			self.stadium_scene.ground_plane_mjcf)
 		self.ground_ids = set([(self.parts[f].bodies[self.parts[f].bodyIndex], self.parts[f].bodyPartIndex) for f in
 							   self.foot_ground_object_names])
+		p.configureDebugVisualizer(p.COV_ENABLE_RENDERING,1)
 		return r

 	def move_robot(self, init_x, init_y, init_z):