Unity-Technologies
diff --git a/‎colab/Colab_UnityEnvironment_4_SB3VectorEnv.ipynb
Lines changed: 323 additions & 0 deletions b/‎colab/Colab_UnityEnvironment_4_SB3VectorEnv.ipynb
Lines changed: 323 additions & 0 deletions
diff --git a/‎com.unity.ml-agents/CHANGELOG.md
Lines changed: 1 addition & 0 deletions b/‎com.unity.ml-agents/CHANGELOG.md
Lines changed: 1 addition & 0 deletions
diff --git a/‎ml-agents-envs/mlagents_envs/envs/unity_gym_env.py
Lines changed: 1 addition & 0 deletions b/‎ml-agents-envs/mlagents_envs/envs/unity_gym_env.py
Lines changed: 1 addition & 0 deletions
@@ -0,0 +1,323 @@
+{
+ "nbformat": 4,
+ "nbformat_minor": 0,
+ "metadata": {
+  "colab": {
+   "name": "Colab-UnityEnvironment-1-Run.ipynb",
+   "private_outputs": true,
+   "provenance": [],
+   "collapsed_sections": [],
+   "toc_visible": true
+  },
+  "kernelspec": {
+   "name": "python3",
+   "language": "python",
+   "display_name": "Python 3"
+  }
+ },
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "pbVXrmEsLXDt"
+   },
+   "source": [
+    "# ML-Agents run with Stable Baselines 3\n",
+    "<img src=\"https://github.com/Unity-Technologies/ml-agents/blob/release_19_docs/docs/images/image-banner.png?raw=true\" align=\"middle\" width=\"435\"/>"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "WNKTwHU3d2-l"
+   },
+   "source": [
+    "## Setup"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "outputs": [],
+   "source": [
+    "#@title Install Rendering Dependencies { display-mode: \"form\" }\n",
+    "#@markdown (You only need to run this code when using Colab's hosted runtime)\n",
+    "\n",
+    "import os\n",
+    "from IPython.display import HTML, display\n",
+    "\n",
+    "def progress(value, max=100):\n",
+    "    return HTML(\"\"\"\n",
+    "        <progress\n",
+    "            value='{value}'\n",
+    "            max='{max}',\n",
+    "            style='width: 100%'\n",
+    "        >\n",
+    "            {value}\n",
+    "        </progress>\n",
+    "    \"\"\".format(value=value, max=max))\n",
+    "\n",
+    "pro_bar = display(progress(0, 100), display_id=True)\n",
+    "\n",
+    "try:\n",
+    "  import google.colab\n",
+    "  INSTALL_XVFB = True\n",
+    "except ImportError:\n",
+    "  INSTALL_XVFB = 'COLAB_ALWAYS_INSTALL_XVFB' in os.environ\n",
+    "\n",
+    "if INSTALL_XVFB:\n",
+    "  with open('frame-buffer', 'w') as writefile:\n",
+    "    writefile.write(\"\"\"#taken from https://gist.github.com/jterrace/2911875\n",
+    "XVFB=/usr/bin/Xvfb\n",
+    "XVFBARGS=\":1 -screen 0 1024x768x24 -ac +extension GLX +render -noreset\"\n",
+    "PIDFILE=./frame-buffer.pid\n",
+    "case \"$1\" in\n",
+    "  start)\n",
+    "    echo -n \"Starting virtual X frame buffer: Xvfb\"\n",
+    "    /sbin/start-stop-daemon --start --quiet --pidfile $PIDFILE --make-pidfile --background --exec $XVFB -- $XVFBARGS\n",
+    "    echo \".\"\n",
+    "    ;;\n",
+    "  stop)\n",
+    "    echo -n \"Stopping virtual X frame buffer: Xvfb\"\n",
+    "    /sbin/start-stop-daemon --stop --quiet --pidfile $PIDFILE\n",
+    "    rm $PIDFILE\n",
+    "    echo \".\"\n",
+    "    ;;\n",
+    "  restart)\n",
+    "    $0 stop\n",
+    "    $0 start\n",
+    "    ;;\n",
+    "  *)\n",
+    "        echo \"Usage: /etc/init.d/xvfb {start|stop|restart}\"\n",
+    "        exit 1\n",
+    "esac\n",
+    "exit 0\n",
+    "    \"\"\")\n",
+    "  !sudo apt-get update\n",
+    "  pro_bar.update(progress(10, 100))\n",
+    "  !sudo DEBIAN_FRONTEND=noninteractive apt install -y daemon wget gdebi-core build-essential libfontenc1 libfreetype6 xorg-dev xorg\n",
+    "  pro_bar.update(progress(20, 100))\n",
+    "  !wget http://security.ubuntu.com/ubuntu/pool/main/libx/libxfont/libxfont1_1.5.1-1ubuntu0.16.04.4_amd64.deb 2>&1\n",
+    "  pro_bar.update(progress(30, 100))\n",
+    "  !wget --output-document xvfb.deb http://security.ubuntu.com/ubuntu/pool/universe/x/xorg-server/xvfb_1.18.4-0ubuntu0.12_amd64.deb 2>&1\n",
+    "  pro_bar.update(progress(40, 100))\n",
+    "  !sudo dpkg -i libxfont1_1.5.1-1ubuntu0.16.04.4_amd64.deb 2>&1\n",
+    "  pro_bar.update(progress(50, 100))\n",
+    "  !sudo dpkg -i xvfb.deb 2>&1\n",
+    "  pro_bar.update(progress(70, 100))\n",
+    "  !rm libxfont1_1.5.1-1ubuntu0.16.04.4_amd64.deb\n",
+    "  pro_bar.update(progress(80, 100))\n",
+    "  !rm xvfb.deb\n",
+    "  pro_bar.update(progress(90, 100))\n",
+    "  !bash frame-buffer start\n",
+    "  os.environ[\"DISPLAY\"] = \":1\"\n",
+    "pro_bar.update(progress(100, 100))"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "Pzj7wgapAcDs"
+   },
+   "source": [
+    "### Installing ml-agents"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "metadata": {
+    "id": "N8yfQqkbebQ5",
+    "pycharm": {
+     "is_executing": true
+    }
+   },
+   "source": [
+    "try:\n",
+    "  import mlagents\n",
+    "  print(\"ml-agents already installed\")\n",
+    "except ImportError:\n",
+    "  !python -m pip install -q mlagents==0.28.0\n",
+    "  print(\"Installed ml-agents\")"
+   ],
+   "execution_count": null,
+   "outputs": []
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "_u74YhSmW6gD"
+   },
+   "source": [
+    "## Run the Environment"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "P-r_cB2rqp5x"
+   },
+   "source": [
+    "### Import dependencies and set some high level parameters."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "metadata": {
+    "id": "YSf-WhxbqtLw"
+   },
+   "source": [
+    "from math import ceil\n",
+    "\n",
+    "from stable_baselines3 import PPO\n",
+    "from stable_baselines3.common.vec_env import VecMonitor\n",
+    "\n",
+    "from mlagents_envs.envs.unity_vec_env import make_mla_sb3_env, LimitedConfig\n",
+    "\n",
+    "# 250K should train to a reward ~= 0.90 for the \"Basic\" environment.\n",
+    "# We set the value lower here to demonstrate just a small amount of trianing.\n",
+    "TOTAL_TAINING_STEPS_GOAL = 40 * 1000\n",
+    "NUM_ENVS = 12\n",
+    "STEPS_PER_UPDATE = 2048"
+   ],
+   "execution_count": 29,
+   "outputs": []
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "### Start Environment from the registry"
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "outputs": [],
+   "source": [
+    "# -----------------\n",
+    "# This code is used to close an env that might not have been closed before\n",
+    "try:\n",
+    "  env.close()\n",
+    "except:\n",
+    "  pass\n",
+    "# -----------------\n",
+    "\n",
+    "env = make_mla_sb3_env(\n",
+    "    config=LimitedConfig(\n",
+    "        env_path_or_name='Basic',  # Can use any name from a registry or a path to your own unity build.\n",
+    "        base_port=6006,\n",
+    "        base_seed=42,\n",
+    "        num_env=NUM_ENVS,\n",
+    "        allow_multiple_obs=True,\n",
+    "    ),\n",
+    "    no_graphics=True,  # Set to false if you are running locally and want to watch the environments move around as they train.\n",
+    ")"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n",
+     "is_executing": true
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "### Create the model"
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "outputs": [],
+   "source": [
+    "# Helps gather stats for our eval() calls later so we can see reward stats.\n",
+    "env = VecMonitor(env)\n",
+    "# Attempt to approximate settings from 3DBall.yaml\n",
+    "model = PPO(\n",
+    "    \"MlpPolicy\",\n",
+    "    env,\n",
+    "    verbose=1,\n",
+    "    learning_rate=lambda prog: 0.0003 * (1.0 - prog),\n",
+    "    # Uncomment this if you want to log tensorboard results when running this notebook locally.\n",
+    "    # tensorboard_log=\"results\",\n",
+    "    n_steps=int(STEPS_PER_UPDATE),\n",
+    ")"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n",
+     "is_executing": true
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "### Train the model"
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "outputs": [],
+   "source": [
+    "training_rounds = ceil(TOTAL_TAINING_STEPS_GOAL / int(STEPS_PER_UPDATE * NUM_ENVS))\n",
+    "for i in range(training_rounds):\n",
+    "    print(f\"Training round {i + 1}/{training_rounds}\")\n",
+    "    # NOTE: rest_num_timesteps should only happen the first time so that tensorboard logs are consistent.\n",
+    "    model.learn(total_timesteps=6000, reset_num_timesteps=(i == 0))\n",
+    "    model.policy.eval()"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n",
+     "is_executing": true
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "h1lIx3_l24OP"
+   },
+   "source": [
+    "### Close the environment\n",
+    "Frees up the ports being used."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "metadata": {
+    "id": "vdWG6_SqtNtv",
+    "pycharm": {
+     "is_executing": true,
+     "name": "#%%\n"
+    }
+   },
+   "source": [
+    "env.close()\n",
+    "print(\"Closed environment\")\n"
+   ],
+   "execution_count": null,
+   "outputs": []
+  }
+ ]
+}
@@ -17,6 +17,7 @@ and this project adheres to
 ### Minor Changes
 #### com.unity.ml-agents / com.unity.ml-agents.extensions (C#)
 #### ml-agents / ml-agents-envs
+- Added the new unity_vec_env file to the ml-agents-envs module
 - Extended support to python 3.9.10
 
 ### Bug Fixes
 
@@ -1,4 +1,5 @@
 import itertools
+
 import numpy as np
 from typing import Any, Dict, List, Optional, Tuple, Union
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,5 @@`
`1`	`1`	`import itertools`
	`2`	`+`
`2`	`3`	`import numpy as np`
`3`	`4`	`from typing import Any, Dict, List, Optional, Tuple, Union`
`4`	`5`