add gym to Dockerfiles

Jon Krohn · Jon Krohn · commit 851df66858f5 · 2017-12-08T16:53:00.000-05:00
diff --git a/Dockerfile b/Dockerfile
@@ -14,3 +14,6 @@ RUN pip install keras==2.0.8
 # install NLP packages:
 RUN pip install nltk==3.2.4
 RUN pip install gensim==2.3.0
+
+# install Reinforcement Learning packages (OpenAI Gym, pinned to the same version as Dockerfile-gpu):
+RUN pip install gym==0.9.4
diff --git a/Dockerfile-gpu b/Dockerfile-gpu
@@ -181,3 +181,6 @@ RUN pip install keras==2.0.8
 ## Install NLP packages
 RUN pip install nltk==3.2.4
 RUN pip install gensim==2.3.0
+
+## Install Reinforcement Learning packages
+RUN pip install gym==0.9.4
diff --git a/notebooks/experimental/JSAnimate_cartpole.ipynb b/notebooks/experimental/JSAnimate_cartpole.ipynb
@@ -0,0 +1,181 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "%matplotlib inline"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "from JSAnimation.IPython_display import display_animation\n",
+    "from matplotlib import animation\n",
+    "import matplotlib.pyplot as plt\n",
+    "from IPython.display import display"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import gym"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "def display_frames_as_gif(frames):\n",
+    "    \"\"\"Show `frames` (a non-empty sequence of image arrays) as a looping animation with controls.\"\"\"\n",
+    "    first = frames[0]\n",
+    "    # figsize is in inches: shape / 72 at dpi=72 makes the figure's pixel size match the frame's shape\n",
+    "    fig = plt.figure(figsize=(first.shape[1] / 72.0, first.shape[0] / 72.0), dpi=72)\n",
+    "    image = plt.imshow(first)\n",
+    "    plt.axis('off')\n",
+    "\n",
+    "    def show_frame(index):\n",
+    "        image.set_data(frames[index])\n",
+    "\n",
+    "    anim = animation.FuncAnimation(fig, show_frame, frames=len(frames), interval=50)\n",
+    "    display(display_animation(anim, default_mode='loop'))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\r",
+      "Episode 0/40 finished after 13 timesteps\r",
+      "Episode 1/40 finished after 15 timesteps\r",
+      "Episode 2/40 finished after 23 timesteps\r",
+      "Episode 3/40 finished after 13 timesteps\r",
+      "Episode 4/40 finished after 12 timesteps\r",
+      "Episode 5/40 finished after 22 timesteps\r",
+      "Episode 6/40 finished after 21 timesteps\r",
+      "Episode 7/40 finished after 14 timesteps\r",
+      "Episode 8/40 finished after 10 timesteps\r",
+      "Episode 9/40 finished after 18 timesteps\r",
+      "Episode 10/40 finished after 22 timesteps\r",
+      "Episode 11/40 finished after 13 timesteps\r",
+      "Episode 12/40 finished after 20 timesteps\r",
+      "Episode 13/40 finished after 43 timesteps\r",
+      "Episode 14/40 finished after 34 timesteps\r",
+      "Episode 15/40 finished after 32 timesteps\r",
+      "Episode 16/40 finished after 14 timesteps\r",
+      "Episode 17/40 finished after 14 timesteps\r",
+      "Episode 18/40 finished after 16 timesteps\r",
+      "Episode 19/40 finished after 14 timesteps\r",
+      "Episode 20/40 finished after 17 timesteps\r",
+      "Episode 21/40 finished after 20 timesteps\r",
+      "Episode 22/40 finished after 13 timesteps\r",
+      "Episode 23/40 finished after 21 timesteps\r",
+      "Episode 24/40 finished after 12 timesteps\r",
+      "Episode 25/40 finished after 17 timesteps\r",
+      "Episode 26/40 finished after 23 timesteps\r",
+      "Episode 27/40 finished after 30 timesteps\r",
+      "Episode 28/40 finished after 43 timesteps\r",
+      "Episode 29/40 finished after 17 timesteps\r",
+      "Episode 30/40 finished after 28 timesteps\r",
+      "Episode 31/40 finished after 26 timesteps\r",
+      "Episode 32/40 finished after 19 timesteps\r",
+      "Episode 33/40 finished after 15 timesteps\r",
+      "Episode 34/40 finished after 44 timesteps\r",
+      "Episode 35/40 finished after 22 timesteps\r",
+      "Episode 36/40 finished after 70 timesteps\r",
+      "Episode 37/40 finished after 24 timesteps\r",
+      "Episode 38/40 finished after 23 timesteps\r",
+      "Episode 39/40 finished after 15 timesteps"
+     ]
+    }
+   ],
+   "source": [
+    "env = gym.make('CartPole-v0')\n",
+    "frames = []  # one rendered RGB array per timestep, accumulated across all episodes\n",
+    "num_episodes = 40\n",
+    "for i_episode in range(num_episodes):\n",
+    "    observation = env.reset()\n",
+    "    for t in range(500):\n",
+    "        # Render into buffer. Do NOT pass close=True here: it closes the viewer and returns None.\n",
+    "        frames.append(env.render(mode='rgb_array'))\n",
+    "        action = env.action_space.sample() # random action\n",
+    "        observation, reward, done, info = env.step(action)\n",
+    "        if done:\n",
+    "            print(\"\\rEpisode {}/{} finished after {} timesteps\".format(i_episode, num_episodes, t+1), end=\"\")\n",
+    "            break\n",
+    "env.render(close=True)  # shut the viewer down once, after every frame has been captured"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "ename": "AttributeError",
+     "evalue": "'NoneType' object has no attribute 'shape'",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[0;31mAttributeError\u001b[0m                            Traceback (most recent call last)",
+      "\u001b[0;32m<ipython-input-6-d67b09ec9573>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mdisplay_frames_as_gif\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mframes\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
+      "\u001b[0;32m<ipython-input-4-9da36626cf94>\u001b[0m in \u001b[0;36mdisplay_frames_as_gif\u001b[0;34m(frames)\u001b[0m\n\u001b[1;32m      3\u001b[0m     \u001b[0mDisplays\u001b[0m \u001b[0ma\u001b[0m \u001b[0mlist\u001b[0m \u001b[0mof\u001b[0m \u001b[0mframes\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0ma\u001b[0m \u001b[0mgif\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mcontrols\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      4\u001b[0m     \"\"\"\n\u001b[0;32m----> 5\u001b[0;31m     \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfigure\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfigsize\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mframes\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m/\u001b[0m \u001b[0;36m72.0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mframes\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m/\u001b[0m \u001b[0;36m72.0\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdpi\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;36m72\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      6\u001b[0m     \u001b[0mpatch\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mimshow\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mframes\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      7\u001b[0m     \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0maxis\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'off'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
+      "\u001b[0;31mAttributeError\u001b[0m: 'NoneType' object has no attribute 'shape'"
+     ]
+    }
+   ],
+   "source": [
+    "display_frames_as_gif(frames)"
+   ]
+  }
+ ],
+ "metadata": {
+  "anaconda-cloud": {},
+  "kernelspec": {
+   "display_name": "Python [conda root]",
+   "language": "python",
+   "name": "conda-root-py"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.5.2"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 1
+}
diff --git a/notebooks/experimental/cartpole.ipynb b/notebooks/experimental/cartpole.ipynb