more fixes for pybullet

This commit is contained in:
Erwin Coumans
2017-08-22 09:32:16 -07:00
parent dd4cc5f4ef
commit 21ca6a90f0
3 changed files with 1 addition and 120 deletions


@@ -1,31 +0,0 @@
"""One-line documentation for gym_example module.
A detailed description of gym_example.
"""
import gym
from envs.bullet.cartpole_bullet import CartPoleBulletEnv
import setuptools
import time
import numpy as np
w = [0.3, 0.02, 0.02, 0.012]
def main():
env = gym.make('CartPoleBulletEnv-v0')
for i_episode in range(1):
observation = env.reset()
done = False
t = 0
while not done:
print(observation)
action = np.array([np.inner(observation, w)])
print(action)
observation, reward, done, info = env.step(action)
t = t + 1
if done:
print("Episode finished after {} timesteps".format(t+1))
break
main()


@@ -1,7 +1,7 @@
import gym
import numpy as np
import pybullet as p
-from .. import pybullet_envs
+import pybullet_envs
import time
def relu(x):

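The one-line change above swaps a package-relative import (from .. import pybullet_envs) for a plain import pybullet_envs, so the example also runs when pybullet_envs is installed as a package instead of being executed from inside the source tree. A minimal sketch of the intended usage, assuming that importing pybullet_envs registers the Bullet environments with gym, and reusing the CartPoleBulletEnv-v0 id from the removed example above:

import gym
import pybullet_envs  # assumption: importing the package registers the Bullet env ids with gym

env = gym.make('CartPoleBulletEnv-v0')  # id taken from the removed gym_example above
observation = env.reset()
for _ in range(100):
  # Gym API of this era: step() returns a 4-tuple.
  observation, reward, done, info = env.step(env.action_space.sample())
  if done:
    observation = env.reset()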

@@ -1,88 +0,0 @@
'''
A test for minitaurGymEnv
'''

import gym
import numpy as np
import math
import tensorflow as tf

from pybullet_envs.bullet.minitaurGymEnv import MinitaurGymEnv

try:
  import sonnet
  from agents import simpleAgentWithSonnet as agent_lib
except ImportError:
  from agents import simpleAgent as agent_lib


def testSinePolicy():
  """Tests the open-loop sine gait policy."""
  np.random.seed(47)
  environment = MinitaurGymEnv(render=True)
  sum_reward = 0
  steps = 1000
  amplitude1Bound = 0.5
  amplitude2Bound = 0.15
  speed = 40
  for stepCounter in range(steps):
    t = float(stepCounter) * environment._timeStep
    # Ramp the sine amplitudes up after the first simulated second.
    if t < 1:
      amplitude1 = 0
      amplitude2 = 0
    else:
      amplitude1 = amplitude1Bound
      amplitude2 = amplitude2Bound
    # Paired legs are driven pi out of phase.
    a1 = math.sin(t * speed) * amplitude1
    a2 = math.sin(t * speed + 3.14) * amplitude1
    a3 = math.sin(t * speed) * amplitude2
    a4 = math.sin(t * speed + 3.14) * amplitude2
    action = [a1, a2, a2, a1, a3, a4, a4, a3]
    state, reward, done, info = environment.step(action)
    sum_reward += reward
    if done:
      environment.reset()
  print("sum reward: ", sum_reward)


def testDDPGPolicy():
  """Tests a pre-trained DDPG policy restored from a checkpoint."""
  environment = MinitaurGymEnv(render=True)
  sum_reward = 0
  steps = 1000
  ckpt_path = 'data/agent/tf_graph_data/tf_graph_data_converted.ckpt-0'
  observation_shape = (28,)
  action_size = 8
  actor_layer_size = (297, 158)
  n_steps = 0
  tf.reset_default_graph()
  with tf.Session() as session:
    # Restore the pre-trained actor network from the checkpoint.
    agent = agent_lib.SimpleAgent(
        session=session, ckpt_path=ckpt_path, actor_layer_size=actor_layer_size)
    state = environment.reset()
    action = agent(state)
    for _ in range(steps):
      n_steps += 1
      state, reward, done, info = environment.step(action)
      action = agent(state)
      sum_reward += reward
      if done:
        # Episode finished: report the totals and start a new episode.
        environment.reset()
        n_steps += 1
        print("total reward: ", sum_reward)
        print("total steps: ", n_steps)
        sum_reward = 0
        n_steps = 0
  return


testDDPGPolicy()
#testSinePolicy()
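
The deleted minitaur test above depends on a local agents package and a TensorFlow checkpoint that are not shipped with pybullet. For reference, a minimal smoke test of the environment alone, assuming the pybullet_envs.bullet.minitaurGymEnv module imported above remains available after this commit:

from pybullet_envs.bullet.minitaurGymEnv import MinitaurGymEnv

environment = MinitaurGymEnv(render=False)
state = environment.reset()
for _ in range(100):
  # Zero commands for all eight motors, matching the 8-element actions used in the removed test.
  state, reward, done, info = environment.step([0.0] * 8)
  if done:
    state = environment.reset()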