add DeepMimic helper utils

2018-11-23 18:01:39 -08:00
parent 7669fc92c5
commit 5f0dcb575f
6 changed files with 344 additions and 0 deletions
--- a/examples/pybullet/gym/pybullet_utils/arg_parser.py
+++ b/examples/pybullet/gym/pybullet_utils/arg_parser.py
@@ -0,0 +1,124 @@
+import re as RE
+
+class ArgParser(object):
+    """Minimal parser for ``--key value value ...`` style argument lists.
+
+    Tokens can come from a sequence of strings (``load_args``) or from a
+    text file (``load_file``). Each key maps to the list of raw string
+    tokens that followed it; the ``parse_*`` accessors convert those tokens
+    on demand and return a caller-supplied default when the key is absent.
+    """
+
+    # Class-level slot; nothing inside this class assigns or reads it.
+    global_parser = None
+
+    # Tokens the boolean accessors treat as True; every other token is False.
+    _TRUE_TOKENS = ('true', 'True', '1', 'T', 't')
+
+    def __init__(self):
+        # Maps a key (without its leading "--") to its list of string values.
+        self._table = dict()
+
+    def clear(self):
+        """Forget every key loaded so far."""
+        self._table.clear()
+
+    def load_args(self, arg_strs):
+        """Parse a flat sequence of tokens into the key/value table.
+
+        A token of at least three characters that starts with ``--`` opens a
+        new key; the tokens that follow, up to the next key, become its
+        values. Tokens starting with ``#`` are skipped. Tokens that appear
+        before the first key are discarded. When a key is already in the
+        table (from an earlier call or earlier in this sequence), the values
+        stored first are kept.
+
+        Returns:
+            Always True.
+        """
+        curr_key = ''
+        vals = []
+        for token in arg_strs:
+            if self._is_comment(token):
+                continue
+            if self._is_key(token):
+                self._store(curr_key, vals)
+                curr_key = token[2:]
+                vals = []
+            else:
+                vals.append(token)
+
+        # Flush the values collected for the final key.
+        self._store(curr_key, vals)
+        return True
+
+    def load_file(self, filename):
+        """Load arguments from a text file.
+
+        The file is split into lines; empty lines and lines whose first
+        character is ``#`` are dropped, the rest are split on whitespace and
+        passed to ``load_args``.
+
+        Returns:
+            The result of ``load_args``.
+
+        Raises:
+            Whatever ``open`` raises when the file cannot be read.
+        """
+        # The context manager closes the file; no explicit close() is needed.
+        with open(filename, 'r') as arg_file:
+            lines = RE.split(r'[\n\r]+', arg_file.read())
+
+        arg_strs = []
+        for line in lines:
+            if line and not self._is_comment(line):
+                arg_strs += line.split()
+
+        return self.load_args(arg_strs)
+
+    def has_key(self, key):
+        """Return True when ``key`` has been loaded."""
+        return key in self._table
+
+    def parse_string(self, key, default=''):
+        """Return the first value of ``key`` as a string, else ``default``."""
+        return self._first(key, default, None)
+
+    def parse_strings(self, key, default=None):
+        """Return all values of ``key`` as stored, else ``default``.
+
+        When ``default`` is omitted (or None) a fresh empty list is returned,
+        so callers never share one mutable default object.
+        """
+        return self._all(key, default, None)
+
+    def parse_int(self, key, default=0):
+        """Return the first value of ``key`` converted with ``int``."""
+        return self._first(key, default, int)
+
+    def parse_ints(self, key, default=None):
+        """Return every value of ``key`` converted with ``int``."""
+        return self._all(key, default, int)
+
+    def parse_float(self, key, default=0.0):
+        """Return the first value of ``key`` converted with ``float``."""
+        return self._first(key, default, float)
+
+    def parse_floats(self, key, default=None):
+        """Return every value of ``key`` converted with ``float``."""
+        return self._all(key, default, float)
+
+    def parse_bool(self, key, default=False):
+        """Return the first value of ``key`` interpreted as a boolean."""
+        return self._first(key, default, self._parse_bool)
+
+    def parse_bools(self, key, default=None):
+        """Return every value of ``key`` interpreted as a boolean."""
+        return self._all(key, default, self._parse_bool)
+
+    def _store(self, key, vals):
+        """Record ``vals`` under ``key`` unless the key is empty or already set."""
+        if key != '' and key not in self._table:
+            self._table[key] = vals
+
+    def _first(self, key, default, convert):
+        """Return the converted first value of ``key``, or ``default``.
+
+        ``default`` is also returned when the key was given without any
+        values, instead of failing with an IndexError.
+        """
+        vals = self._table.get(key)
+        if not vals:
+            return default
+        return vals[0] if convert is None else convert(vals[0])
+
+    def _all(self, key, default, convert):
+        """Return all (optionally converted) values of ``key``, or ``default``."""
+        if key not in self._table:
+            return [] if default is None else default
+        vals = self._table[key]
+        if convert is None:
+            # Unconverted access hands back the stored list itself.
+            return vals
+        return [convert(val) for val in vals]
+
+    def _is_comment(self, token):
+        """Return True when ``token`` begins with ``#``."""
+        return token.startswith('#')
+
+    def _is_key(self, token):
+        """Return True for tokens shaped like ``--name`` (at least 3 chars)."""
+        return len(token) >= 3 and token.startswith('--')
+
+    def _parse_bool(self, token):
+        """Return True only for the tokens listed in ``_TRUE_TOKENS``."""
+        return token in self._TRUE_TOKENS
--- a/examples/pybullet/gym/pybullet_utils/examples/testlog.py
+++ b/examples/pybullet/gym/pybullet_utils/examples/testlog.py
@@ -0,0 +1,9 @@
+from pybullet_utils.logger import Logger
+# Small walkthrough of the Logger API: configure a file, log, print, dump.
+logger = Logger()
+logger.configure_output_file("e:/mylog.txt")
+
+# Every pass logs the same key, so the current row keeps one "Iteration" entry.
+for i in range(10):
+    logger.log_tabular("Iteration", 1)
+
+Logger.print2("hello world")
+
+# Show the current row on the console, then write it to the output file.
+logger.print_tabular()
+logger.dump_tabular()
--- a/examples/pybullet/gym/pybullet_utils/logger.py
+++ b/examples/pybullet/gym/pybullet_utils/logger.py
@@ -0,0 +1,128 @@
+import pybullet_utils.mpi_util as MPIUtil
+
+"""
+
+Some simple logging functionality, inspired by rllab's logging.
+Assumes that each diagnostic gets logged each iteration
+
+Call configure_output_file() on a Logger instance to start logging to a
+text file whose columns are left-aligned and padded to 25 characters
+(some_file_name.txt)
+
+To load the learning curves, you can do, for example
+
+A = np.genfromtxt('/tmp/expt_1468984536/log.txt', dtype=None, names=True)
+A['EpRewMean']
+
+"""
+
+import os.path as osp, shutil, time, atexit, os, subprocess
+
+class Logger:
+    """Tabular diagnostics logger that prints and writes only on the root MPI process.
+
+    Typical use: call ``configure_output_file`` once, then in each iteration
+    call ``log_tabular`` for every diagnostic followed by ``print_tabular``
+    and/or ``dump_tabular``. The set of keys is fixed by whatever is logged
+    before the first ``dump_tabular`` call.
+    """
+
+    @staticmethod
+    def print2(str):
+        """Print ``str`` to stdout, but only on the root MPI process."""
+        if MPIUtil.is_root_proc():
+            print(str)
+        return
+
+    def __init__(self):
+        self.output_file = None        # open file handle, or None when not logging to disk
+        self.first_row = True          # True until the first dump_tabular() call
+        self.log_headers = []          # diagnostic keys in first-seen order
+        self.log_current_row = {}      # key -> value for the current iteration
+        self._dump_str_template = ""   # format string built on the first dump
+        return
+
+    def reset(self):
+        """Clear headers and the current row, and truncate the output file if one is open."""
+        self.first_row = True
+        self.log_headers = []
+        self.log_current_row = {}
+        if self.output_file is not None:
+            # Reopen the same path in write mode so the next dump starts a
+            # fresh file with a new header line.
+            output_path = self.output_file.name
+            self.output_file.close()
+            self.output_file = open(output_path, 'w')
+            atexit.register(self.output_file.close)
+        return
+
+    def configure_output_file(self, filename=None):
+        """
+        Start logging to ``filename``.
+
+        When ``filename`` is None (or empty), the path defaults to
+        "output/log_<unix time>.txt". A missing parent directory is created.
+        Only the root MPI process creates the directory and opens the file;
+        on other processes ``output_file`` is left unchanged.
+        """
+        self.first_row = True
+        self.log_headers = []
+        self.log_current_row = {}
+
+        output_path = filename or "output/log_%i.txt"%int(time.time())
+
+        out_dir = os.path.dirname(output_path)
+        # A bare filename has an empty dirname; os.makedirs('') would raise.
+        if out_dir and not os.path.exists(out_dir) and MPIUtil.is_root_proc():
+            os.makedirs(out_dir)
+
+        if (MPIUtil.is_root_proc()):
+            if self.output_file is not None:
+                # Do not leave a previously configured file open.
+                self.output_file.close()
+            self.output_file = open(output_path, 'w')
+            assert osp.exists(output_path)
+            atexit.register(self.output_file.close)
+
+            Logger.print2("Logging data to " + self.output_file.name)
+        return
+
+    def log_tabular(self, key, val):
+        """
+        Log a value of some diagnostic
+        Call this once for each diagnostic quantity, each iteration
+
+        New keys are accepted only before the first dump_tabular() call;
+        afterwards an unknown key trips the assertion below.
+        """
+        if self.first_row and key not in self.log_headers:
+            self.log_headers.append(key)
+        else:
+            assert key in self.log_headers, "Trying to introduce a new key %s that you didn't include in the first iteration"%key
+        self.log_current_row[key] = val
+        return
+
+    def get_num_keys(self):
+        """Return the number of distinct diagnostic keys seen so far."""
+        return len(self.log_headers)
+
+    def print_tabular(self):
+        """
+        Print all of the diagnostics from the current iteration
+
+        Keys with no value in the current row are printed with an empty value.
+        """
+        if (MPIUtil.is_root_proc()):
+            Logger.print2("-"*37)
+            for key in self.log_headers:
+                val = self.log_current_row.get(key, "")
+                if isinstance(val, float):
+                    valstr = "%8.3g"%val
+                elif isinstance(val, int):
+                    valstr = str(val)
+                else:
+                    valstr = val
+                Logger.print2("| %15s | %15s |"%(key, valstr))
+            Logger.print2("-" * 37)
+        return
+
+    def dump_tabular(self):
+        """
+        Write all of the diagnostics from the current iteration
+
+        On the root process a header line is written before the first row.
+        On every process the current row is cleared and the key set is
+        frozen afterwards.
+        """
+        if (MPIUtil.is_root_proc()):
+            if (self.first_row):
+                self._dump_str_template = self._build_str_template()
+
+            vals = [self.log_current_row.get(key, "") for key in self.log_headers]
+
+            if self.output_file is not None:
+                if self.first_row:
+                    header_str = self._dump_str_template.format(*self.log_headers)
+                    self.output_file.write(header_str + "\n")
+
+                val_str = self._dump_str_template.format(*map(str,vals))
+                self.output_file.write(val_str + "\n")
+                self.output_file.flush()
+
+        self.log_current_row.clear()
+        self.first_row=False
+        return
+
+    def _build_str_template(self):
+        """Return a format string with one left-aligned 25-character column per key."""
+        num_keys = self.get_num_keys()
+        template = "{:<25}" * num_keys
+        return template
--- a/examples/pybullet/gym/pybullet_utils/math_util.py
+++ b/examples/pybullet/gym/pybullet_utils/math_util.py
@@ -0,0 +1,18 @@
+import numpy as np
+
+# Multiply an angle in radians by this factor to get degrees (about 180 / pi).
+RAD_TO_DEG = 57.2957795
+# Multiply an angle in degrees by this factor to get radians.
+DEG_TO_RAD = 1.0 / RAD_TO_DEG
+# Sentinel index; presumably means "no valid index" - confirm against callers.
+INVALID_IDX = -1
+
+def lerp(x, y, t):
+    """Linearly interpolate between ``x`` (at t=0) and ``y`` (at t=1)."""
+    weight_x = 1 - t
+    return weight_x * x + t * y
+
+def log_lerp(x, y, t):
+    """Interpolate between ``x`` and ``y`` linearly in log space."""
+    log_x = np.log(x)
+    log_y = np.log(y)
+    return np.exp(lerp(log_x, log_y, t))
+
+def flatten(arr_list):
+    """Reshape every entry of ``arr_list`` to 1-D and join them into one array."""
+    flat_parts = []
+    for arr in arr_list:
+        flat_parts.append(np.reshape(arr, [-1]))
+    return np.concatenate(flat_parts, axis=0)
+
+def flip_coin(p):
+    """Draw one binomial sample with success probability ``p``; True on success."""
+    draws = np.random.binomial(1, p, 1)
+    outcome = draws[0]
+    return outcome == 1
--- a/examples/pybullet/gym/pybullet_utils/mpi_util.py
+++ b/examples/pybullet/gym/pybullet_utils/mpi_util.py
@@ -0,0 +1,52 @@
+import numpy as np
+from mpi4py import MPI
+
+# Rank compared against in is_root_proc() and used as the broadcast root in bcast().
+ROOT_PROC_RANK = 0
+
+def get_num_procs():
+    """Return the size of ``MPI.COMM_WORLD``."""
+    world = MPI.COMM_WORLD
+    return world.Get_size()
+
+def get_proc_rank():
+    """Return the calling process's rank within ``MPI.COMM_WORLD``."""
+    world = MPI.COMM_WORLD
+    return world.Get_rank()
+
+def is_root_proc():
+    """Return True when the calling process has rank ``ROOT_PROC_RANK``."""
+    return get_proc_rank() == ROOT_PROC_RANK
+
+def bcast(x):
+    """Broadcast buffer ``x`` from the root rank over ``MPI.COMM_WORLD``.
+
+    ``x`` is handed straight to ``Bcast``; nothing is returned.
+    """
+    world = MPI.COMM_WORLD
+    world.Bcast(x, root=ROOT_PROC_RANK)
+
+def reduce_sum(x):
+    """Combine ``x`` across all processes with ``MPI.SUM`` via ``reduce_all``."""
+    return reduce_all(x, op=MPI.SUM)
+
+def reduce_prod(x):
+    """Combine ``x`` across all processes with ``MPI.PROD`` via ``reduce_all``."""
+    return reduce_all(x, op=MPI.PROD)
+
+def reduce_avg(x):
+    """Return the sum of ``x`` over all processes divided by the process count.
+
+    The division builds a new value rather than dividing in place, because
+    NumPy refuses an in-place true division on an integer array.
+    """
+    total = reduce_sum(x)
+    return total / get_num_procs()
+
+def reduce_min(x):
+    """Combine ``x`` across all processes with ``MPI.MIN`` via ``reduce_all``."""
+    return reduce_all(x, op=MPI.MIN)
+
+def reduce_max(x):
+    """Combine ``x`` across all processes with ``MPI.MAX`` via ``reduce_all``."""
+    return reduce_all(x, op=MPI.MAX)
+
+def reduce_all(x, op):
+    """Run ``Allreduce`` on ``x`` with operation ``op`` over ``MPI.COMM_WORLD``.
+
+    An ndarray is reduced as-is and a new array of the same shape is
+    returned. Any other value is wrapped in a one-element array for the
+    call and the single reduced element is returned.
+    """
+    world = MPI.COMM_WORLD
+    if isinstance(x, np.ndarray):
+        result = np.zeros_like(x)
+        world.Allreduce(x, result, op=op)
+        return result
+
+    send_buf = np.array([x])
+    recv_buf = np.zeros_like(send_buf)
+    world.Allreduce(send_buf, recv_buf, op=op)
+    return recv_buf[0]
+
+def gather_all(x):
+    """Collect ``x`` from every process with ``Allgather`` over ``MPI.COMM_WORLD``.
+
+    ``x`` is wrapped in a leading axis of length one, and the receive buffer
+    repeats that shape once per process along axis 0.
+
+    Returns:
+        A list with one entry per row of the receive buffer.
+    """
+    x_buf = np.array([x])
+    recv_buf = np.repeat(np.zeros_like(x_buf), get_num_procs(), axis=0)
+    MPI.COMM_WORLD.Allgather(x_buf, recv_buf)
+    return list(recv_buf)
--- a/examples/pybullet/gym/pybullet_utils/util.py
+++ b/examples/pybullet/gym/pybullet_utils/util.py
@@ -0,0 +1,13 @@
+import random
+import numpy as np
+
+def set_global_seeds(seed):
+    """Seed TensorFlow (when installed), NumPy and Python's ``random`` module.
+
+    TensorFlow is optional: if importing it fails, only NumPy and ``random``
+    are seeded.
+    """
+    try:
+        import tensorflow as tf
+    except ImportError:
+        pass
+    else:
+        # TensorFlow 2 exposes tf.random.set_seed and no longer has the
+        # top-level tf.set_random_seed; use whichever this install provides.
+        tf_random = getattr(tf, 'random', None)
+        if hasattr(tf_random, 'set_seed'):
+            tf_random.set_seed(seed)
+        else:
+            tf.set_random_seed(seed)
+    np.random.seed(seed)
+    random.seed(seed)
+    return