diff --git a/examples/pybullet/gym/pybullet_envs/deep_mimic/env/pd_controller_stable.py b/examples/pybullet/gym/pybullet_envs/deep_mimic/env/pd_controller_stable.py
index 76f13bbf5..bb0f5f243 100644
--- a/examples/pybullet/gym/pybullet_envs/deep_mimic/env/pd_controller_stable.py
+++ b/examples/pybullet/gym/pybullet_envs/deep_mimic/env/pd_controller_stable.py
@@ -141,4 +141,4 @@ class PDControllerStable(object):
     maxF = np.array(maxForces)
     forces = np.clip(tau, -maxF , maxF )
     #print("c=",c)
-    return tau
\ No newline at end of file
+    return tau
diff --git a/examples/pybullet/gym/pybullet_envs/deep_mimic/env/pybullet_deep_mimic_env.py b/examples/pybullet/gym/pybullet_envs/deep_mimic/env/pybullet_deep_mimic_env.py
index f7c42e457..380c90cbc 100644
--- a/examples/pybullet/gym/pybullet_envs/deep_mimic/env/pybullet_deep_mimic_env.py
+++ b/examples/pybullet/gym/pybullet_envs/deep_mimic/env/pybullet_deep_mimic_env.py
@@ -22,8 +22,10 @@ class PyBulletDeepMimicEnv(Env):
   def reset(self):
     self.t = 0
     if not self._isInitialized:
-      self._pybullet_client = bullet_client.BulletClient(connection_mode=p1.GUI)
-      #self._pybullet_client = bullet_client.BulletClient()
+      if self.enable_draw:
+        self._pybullet_client = bullet_client.BulletClient(connection_mode=p1.GUI)
+      else:
+        self._pybullet_client = bullet_client.BulletClient()
       self._pybullet_client.setAdditionalSearchPath(pybullet_data.getDataPath())
 
       z2y = self._pybullet_client.getQuaternionFromEuler([-math.pi*0.5,0,0])
@@ -198,7 +200,7 @@ class PyBulletDeepMimicEnv(Env):
     state = self._humanoid.getState()
     state[1]=state[1]+0.008
     #print("record_state=",state)
-    return state
+    return np.array(state)
 
 
   def record_goal(self, agent_id):
@@ -241,11 +243,11 @@ class PyBulletDeepMimicEnv(Env):
   def is_episode_end(self):
     isEnded = self._humanoid.terminates()
     #also check maximum time, 20 seconds (todo get from file)
-    print("self.t=",self.t)
+    #print("self.t=",self.t)
     if (self.t>3):
       isEnded = True
     return isEnded
 
   def check_valid_episode(self):
     #could check if limbs exceed velocity threshold
-    return true
\ No newline at end of file
+    return true
diff --git a/examples/pybullet/gym/pybullet_envs/deep_mimic/learning/agent_builder.py b/examples/pybullet/gym/pybullet_envs/deep_mimic/learning/agent_builder.py
index e664645aa..ca54f46d5 100644
--- a/examples/pybullet/gym/pybullet_envs/deep_mimic/learning/agent_builder.py
+++ b/examples/pybullet/gym/pybullet_envs/deep_mimic/learning/agent_builder.py
@@ -1,12 +1,13 @@
 import json
 import numpy as np
 from learning.ppo_agent import PPOAgent
+import pybullet_data
 
 AGENT_TYPE_KEY = "AgentType"
 
 def build_agent(world, id, file):
   agent = None
-  with open(file) as data_file:
+  with open(pybullet_data.getDataPath()+"/"+file) as data_file:
     json_data = json.load(data_file)
 
   assert AGENT_TYPE_KEY in json_data
@@ -17,4 +18,4 @@ def build_agent(world, id, file):
   else:
     assert False, 'Unsupported agent type: ' + agent_type
 
-  return agent
\ No newline at end of file
+  return agent
diff --git a/examples/pybullet/gym/pybullet_envs/deep_mimic/learning/replay_buffer.py b/examples/pybullet/gym/pybullet_envs/deep_mimic/learning/replay_buffer.py
index a898f59d4..284515851 100644
--- a/examples/pybullet/gym/pybullet_envs/deep_mimic/learning/replay_buffer.py
+++ b/examples/pybullet/gym/pybullet_envs/deep_mimic/learning/replay_buffer.py
@@ -2,7 +2,7 @@ import numpy as np
 import copy
 from pybullet_utils.logger import Logger
 import inspect as inspect
-from env.env import Env
+from pybullet_envs.deep_mimic.env.env import Env
 import pybullet_utils.math_util as MathUtil
 
 class ReplayBuffer(object):
@@ -348,4 +348,4 @@ class SampleBuffer(object):
     count0 = np.sum(self.idx_to_slot == MathUtil.INVALID_IDX)
     count1 = np.sum(self.slot_to_idx == MathUtil.INVALID_IDX)
     valid &= count0 == count1
-    return valid
\ No newline at end of file
+    return valid
diff --git a/examples/pybullet/gym/pybullet_envs/deep_mimic/testrl.py b/examples/pybullet/gym/pybullet_envs/deep_mimic/testrl.py
index 1ea840ffb..2d82e4521 100644
--- a/examples/pybullet/gym/pybullet_envs/deep_mimic/testrl.py
+++ b/examples/pybullet/gym/pybullet_envs/deep_mimic/testrl.py
@@ -1,5 +1,11 @@
+import os
+import inspect
+currentdir = os.path.dirname(os.path.abspath(inspect.getfile(inspect.currentframe())))
+parentdir = os.path.dirname(os.path.dirname(currentdir))
+os.sys.path.insert(0,parentdir)
+print("parentdir=",parentdir)
 import json
-from learning.rl_world import RLWorld
+from pybullet_envs.deep_mimic.learning.rl_world import RLWorld
 from learning.ppo_agent import PPOAgent
 import pybullet_data
 
@@ -36,7 +42,7 @@ print("bodies=",bodies)
 int_output_path = arg_parser.parse_string("int_output_path")
 print("int_output_path=",int_output_path)
 
-agent_files = arg_parser.parse_string("agent_files")
+agent_files = pybullet_data.getDataPath()+"/"+arg_parser.parse_string("agent_files")
 
 
 AGENT_TYPE_KEY = "AgentType"
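For context, a minimal standalone sketch (not part of the patch) of the GUI-versus-headless selection that the modified reset() now performs: when drawing is enabled it opens a pybullet GUI client, otherwise it creates a BulletClient with no connection mode, which falls back to a headless connection. It assumes pybullet, pybullet_utils and pybullet_data are installed; the local enable_draw flag stands in for the environment's constructor argument.

import pybullet as p1
import pybullet_data
from pybullet_utils import bullet_client

enable_draw = False  # stand-in for PyBulletDeepMimicEnv's enable_draw flag

if enable_draw:
  # opens the OpenGL visualizer window
  pb = bullet_client.BulletClient(connection_mode=p1.GUI)
else:
  # no connection_mode given: BulletClient tries SHARED_MEMORY and then
  # falls back to a headless DIRECT connection
  pb = bullet_client.BulletClient()

pb.setAdditionalSearchPath(pybullet_data.getDataPath())
print("data path =", pybullet_data.getDataPath())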