bullet3/examples/pybullet/gym/pybullet_envs/deep_mimic/testrl.py

import time
import os
import inspect
# Absolute directory that contains this script file.
currentdir = os.path.dirname(os.path.abspath(inspect.getfile(inspect.currentframe())))
# Two directory levels above this script's directory.
parentdir = os.path.dirname(os.path.dirname(currentdir))
# Put that directory first on the module search path (`os.sys` is the `sys`
# module reached through `os`). Presumably this lets the `pybullet_envs`
# imports below resolve against the local checkout -- TODO confirm.
os.sys.path.insert(0, parentdir)
print("parentdir=", parentdir)
import json
from pybullet_envs.deep_mimic.learning.rl_world import RLWorld
from pybullet_envs.deep_mimic.learning.ppo_agent import PPOAgent

import pybullet_data
from pybullet_utils.arg_parser import ArgParser
from pybullet_utils.logger import Logger
from pybullet_envs.deep_mimic.env.pybullet_deep_mimic_env import PyBulletDeepMimicEnv
import sys
import random

# Fixed step passed to world.update() and used as the sleep interval of the
# main loop.
update_timestep = 1.0 / 240.0

# Keyboard-driven playback state: space toggles `animating`, and 'i' sets
# `step` to request a single update.
animating, step = True, False

# Per-episode accumulators maintained by update_world().
total_reward, steps = 0, 0

def update_world(world, time_elapsed):
  """Advance `world` by one fixed timestep and track the episode reward.

  The world is always stepped by the module-level `update_timestep`;
  `time_elapsed` is accepted but not used. The reward of agent 0 is added to
  the module-level `total_reward` and `steps` is incremented. When the
  environment reports the end of the episode, or once 1000 steps have been
  taken, the accumulated reward is printed, both counters are cleared, and the
  world is ended and reset.

  Args:
    world: object providing `update`, `end_episode`, `reset` and an `env`
      with `calc_reward` and `is_episode_end`.
    time_elapsed: ignored.
  """
  global total_reward, steps

  world.update(update_timestep)
  total_reward += world.env.calc_reward(agent_id=0)
  steps += 1

  episode_over = world.env.is_episode_end()
  if not (episode_over or steps >= 1000):
    return

  # Episode finished (or hit the step cap): report and start over.
  print("total_reward=", total_reward)
  total_reward = 0
  steps = 0
  world.end_episode()
  world.reset()


def build_arg_parser(args):
  """Create an ArgParser from command-line args plus an argument file.

  The command-line `args` are loaded first. The `arg_file` entry names a file
  under `<pybullet_data path>/args/`; when it is absent or empty,
  "run_humanoid3d_backflip_args.txt" is used. That file is then loaded into
  the same parser.

  Args:
    args: list of command-line argument strings handed to
      `ArgParser.load_args`.

  Returns:
    The populated ArgParser.

  Raises:
    AssertionError: if the argument file could not be loaded. This is raised
      explicitly (rather than via an `assert` statement) so the check still
      runs under `python -O` and the exception carries the failure message.
  """
  arg_parser = ArgParser()
  arg_parser.load_args(args)

  arg_file = arg_parser.parse_string('arg_file', '')
  if arg_file == '':
    # No file requested: fall back to the backflip configuration.
    arg_file = "run_humanoid3d_backflip_args.txt"

  path = pybullet_data.getDataPath() + "/args/" + arg_file
  succ = arg_parser.load_file(path)
  Logger.print2(arg_file)
  if not succ:
    message = 'Failed to load args from: ' + arg_file
    Logger.print2(message)
    raise AssertionError(message)
  return arg_parser


# Command-line arguments without the script name; the main block passes
# these to build_world().
args = sys.argv[1:]


def build_world(args, enable_draw):
  """Build the environment, the RL world and a non-training PPO agent.

  Parses the arguments, creates a `PyBulletDeepMimicEnv` and wraps it in an
  `RLWorld`, prints several parsed settings, loads the agent JSON file named
  by the `agent_files` argument (relative to the pybullet_data path),
  constructs a `PPOAgent` from it with training disabled, and resets the
  world. The constructed agent is not stored by this function; only the world
  is returned.

  Args:
    args: list of command-line argument strings.
    enable_draw: forwarded to `PyBulletDeepMimicEnv` as its second argument.

  Returns:
    The `RLWorld` instance, already reset.

  Raises:
    AssertionError: if the agent JSON has no "AgentType" key (or, from
      `build_arg_parser`, if the argument file cannot be loaded).
  """
  AGENT_TYPE_KEY = "AgentType"
  # The original passed the builtin function `id` as the agent id because no
  # local `id` was defined. Use agent 0, matching update_world(), which
  # queries the reward with agent_id=0.
  AGENT_ID = 0

  arg_parser = build_arg_parser(args)
  print("enable_draw=", enable_draw)
  env = PyBulletDeepMimicEnv(arg_parser, enable_draw)
  world = RLWorld(env, arg_parser)

  # Echo the parsed settings.
  motion_file = arg_parser.parse_string("motion_file")
  print("motion_file=", motion_file)
  bodies = arg_parser.parse_ints("fall_contact_bodies")
  print("bodies=", bodies)
  int_output_path = arg_parser.parse_string("int_output_path")
  print("int_output_path=", int_output_path)
  agent_files = pybullet_data.getDataPath() + "/" + arg_parser.parse_string("agent_files")

  print("agent_file=", agent_files)
  # Only the JSON read needs the file handle; close it before building the agent.
  with open(agent_files) as data_file:
    json_data = json.load(data_file)
  print("json_data=", json_data)
  assert AGENT_TYPE_KEY in json_data
  agent_type = json_data[AGENT_TYPE_KEY]
  print("agent_type=", agent_type)

  agent = PPOAgent(world, AGENT_ID, json_data)
  agent.set_enable_training(False)
  world.reset()
  return world


if __name__ == '__main__':
  # Build the world with drawing enabled and run until the PyBullet client
  # disconnects.
  world = build_world(args, True)

  while world.env._pybullet_client.isConnected():
    frame_dt = update_timestep
    time.sleep(frame_dt)
    pressed = world.env.getKeyboardEvents()

    # Space toggles continuous playback; 'i' requests a single step.
    toggle_requested = world.env.isKeyTriggered(pressed, ' ')
    single_step_requested = world.env.isKeyTriggered(pressed, 'i')
    if toggle_requested:
      animating = not animating
    if single_step_requested:
      step = True

    # Paused with no pending single step: nothing to simulate this frame.
    if not (animating or step):
      continue

    update_world(world, frame_dt)
    step = False
deep_mimic: replace retrained backflip policy 2019-07-23 14:27:17 +00:00			`import time`
enable deepmimic training on mac 2019-02-02 00:24:48 +00:00			`import os`
			`import inspect`
			`currentdir = os.path.dirname(os.path.abspath(inspect.getfile(inspect.currentframe())))`
			`parentdir = os.path.dirname(os.path.dirname(currentdir))`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`os.sys.path.insert(0, parentdir)`
			`print("parentdir=", parentdir)`
enable stable PD plugin in premake4.lua PyBullet add a normalize in the setRotation axis/angle to be sure. Add more code from the DeepMimic project, training doesn't work yet. 2019-02-01 05:31:26 +00:00			`import json`
enable deepmimic training on mac 2019-02-02 00:24:48 +00:00			`from pybullet_envs.deep_mimic.learning.rl_world import RLWorld`
fixes in PyBullet deep_mimic to allow running in pip version 2019-02-11 16:51:07 +00:00			`from pybullet_envs.deep_mimic.learning.ppo_agent import PPOAgent`
enable stable PD plugin in premake4.lua PyBullet add a normalize in the setRotation axis/angle to be sure. Add more code from the DeepMimic project, training doesn't work yet. 2019-02-01 05:31:26 +00:00
			`import pybullet_data`
			`from pybullet_utils.arg_parser import ArgParser`
			`from pybullet_utils.logger import Logger`
			`from pybullet_envs.deep_mimic.env.pybullet_deep_mimic_env import PyBulletDeepMimicEnv`
			`import sys`
			`import random`

add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`update_timestep = 1. / 240.`
allow pybullet_envs.deep_mimic.testrl --arg_file run_humanoid3d_backflip_args.txt to perform a backflip. Can only backflip twice, then drops on ground. this deepmimic is still very slow, due to slow mass matrix/inverse dynamics computation. once spherical motor drive is enabled, it should be fast(er) move pd_controller_stable to pybullet_utils for easier re-use add plane_transparent.urdf to pybullet_data allow spacebar in keyboardEvents (Windows for now) 2019-02-11 04:56:31 +00:00			`animating = True`
deep_mimic: replace retrained backflip policy 2019-07-23 14:27:17 +00:00			`step = False`
set correct reward for deep_mimic gymenv (max episode = 1000 steps, 1 reward at each step) terminate testrl.py at 1000, show reward 2020-03-02 05:27:30 +00:00			`total_reward = 0`
			`steps = 0`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00
add mpi_run version (not working yet) 2019-02-02 01:57:31 +00:00			`def update_world(world, time_elapsed):`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`timeStep = update_timestep`
			`world.update(timeStep)`
			`reward = world.env.calc_reward(agent_id=0)`
set correct reward for deep_mimic gymenv (max episode = 1000 steps, 1 reward at each step) terminate testrl.py at 1000, show reward 2020-03-02 05:27:30 +00:00			`global total_reward`
			`total_reward += reward`
			`global steps`
			`steps+=1`

add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`#print("reward=",reward)`
set correct reward for deep_mimic gymenv (max episode = 1000 steps, 1 reward at each step) terminate testrl.py at 1000, show reward 2020-03-02 05:27:30 +00:00			`#print("steps=",steps)`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`end_episode = world.env.is_episode_end()`
set correct reward for deep_mimic gymenv (max episode = 1000 steps, 1 reward at each step) terminate testrl.py at 1000, show reward 2020-03-02 05:27:30 +00:00			`if (end_episode or steps>= 1000):`
			`print("total_reward=",total_reward)`
			`total_reward=0`
			`steps = 0`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`world.end_episode()`
			`world.reset()`
			`return`

add mpi_run version (not working yet) 2019-02-02 01:57:31 +00:00
enable stable PD plugin in premake4.lua PyBullet add a normalize in the setRotation axis/angle to be sure. Add more code from the DeepMimic project, training doesn't work yet. 2019-02-01 05:31:26 +00:00			`def build_arg_parser(args):`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`arg_parser = ArgParser()`
			`arg_parser.load_args(args)`
enable stable PD plugin in premake4.lua PyBullet add a normalize in the setRotation axis/angle to be sure. Add more code from the DeepMimic project, training doesn't work yet. 2019-02-01 05:31:26 +00:00
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`arg_file = arg_parser.parse_string('arg_file', '')`
enable self-collision for deep_mimic pybullet_envs and make it easier to try it out: python3 -m pybullet_envs.deep_mimic.testrl 2019-11-30 21:19:28 +00:00			`if arg_file == '':`
			`arg_file = "run_humanoid3d_backflip_args.txt"`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`if (arg_file != ''):`
			`path = pybullet_data.getDataPath() + "/args/" + arg_file`
			`succ = arg_parser.load_file(path)`
			`Logger.print2(arg_file)`
			`assert succ, Logger.print2('Failed to load args from: ' + arg_file)`
			`return arg_parser`
enable stable PD plugin in premake4.lua PyBullet add a normalize in the setRotation axis/angle to be sure. Add more code from the DeepMimic project, training doesn't work yet. 2019-02-01 05:31:26 +00:00

add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`args = sys.argv[1:]`
enable stable PD plugin in premake4.lua PyBullet add a normalize in the setRotation axis/angle to be sure. Add more code from the DeepMimic project, training doesn't work yet. 2019-02-01 05:31:26 +00:00

update mpi usage 2019-02-02 03:20:08 +00:00			`def build_world(args, enable_draw):`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`arg_parser = build_arg_parser(args)`
			`print("enable_draw=", enable_draw)`
			`env = PyBulletDeepMimicEnv(arg_parser, enable_draw)`
			`world = RLWorld(env, arg_parser)`
			`#world.env.set_playback_speed(playback_speed)`

			`motion_file = arg_parser.parse_string("motion_file")`
			`print("motion_file=", motion_file)`
			`bodies = arg_parser.parse_ints("fall_contact_bodies")`
			`print("bodies=", bodies)`
			`int_output_path = arg_parser.parse_string("int_output_path")`
			`print("int_output_path=", int_output_path)`
			`agent_files = pybullet_data.getDataPath() + "/" + arg_parser.parse_string("agent_files")`

			`AGENT_TYPE_KEY = "AgentType"`

			`print("agent_file=", agent_files)`
			`with open(agent_files) as data_file:`
			`json_data = json.load(data_file)`
			`print("json_data=", json_data)`
			`assert AGENT_TYPE_KEY in json_data`
			`agent_type = json_data[AGENT_TYPE_KEY]`
			`print("agent_type=", agent_type)`
			`agent = PPOAgent(world, id, json_data)`

			`agent.set_enable_training(False)`
			`world.reset()`
			`return world`


update mpi usage 2019-02-02 03:20:08 +00:00			`if __name__ == '__main__':`
add mpi_run version (not working yet) 2019-02-02 01:57:31 +00:00
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`world = build_world(args, True)`
			`while (world.env._pybullet_client.isConnected()):`
deep_mimic: replace retrained backflip policy 2019-07-23 14:27:17 +00:00
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`timeStep = update_timestep`
deep_mimic: replace retrained backflip policy 2019-07-23 14:27:17 +00:00			`time.sleep(timeStep)`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`keys = world.env.getKeyboardEvents()`

			`if world.env.isKeyTriggered(keys, ' '):`
			`animating = not animating`
deep_mimic: replace retrained backflip policy 2019-07-23 14:27:17 +00:00			`if world.env.isKeyTriggered(keys, 'i'):`
			`step = True`
			`if (animating or step):`
add yapf style and apply yapf to format all Python files This recreates pull request #2192 2019-04-27 14:31:15 +00:00			`update_world(world, timeStep)`
deep_mimic: replace retrained backflip policy 2019-07-23 14:27:17 +00:00			`step = False`