Merge branch 'master' into batch-norm

ray-project · Nov 27, 2018 · dedd3a8 · dedd3a8
2 parents 3819373 + e3c088f
commit dedd3a8
Show file tree

Hide file tree

Showing 29 changed files with 483 additions and 1,010 deletions.
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -111,7 +111,10 @@ if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES")
     list(APPEND ray_file_list "src/credis/redis/src/redis-server")
   endif()
 
-  if (DEFINED ENV{INCLUDE_UI} AND "$ENV{INCLUDE_UI}" STREQUAL "1")
+  # The goal of the if statement below is to require the catapult files to be
+  # present INCLUDE_UI=1 is set and to include the UI files if they are present.
+  # This should match the logic in build_ui.sh.
+  if (EXISTS "${CMAKE_BINARY_DIR}/src/catapult_files/index.html" OR "$ENV{INCLUDE_UI}" STREQUAL "1")
     list(APPEND ray_file_list "src/catapult_files/index.html")
     list(APPEND ray_file_list "src/catapult_files/trace_viewer_full.html")
   endif()

diff --git a/doc/source/rllib-algorithms.rst b/doc/source/rllib-algorithms.rst
@@ -119,12 +119,12 @@ SpaceInvaders  692                       ~600
    :start-after: __sphinx_doc_begin__
    :end-before: __sphinx_doc_end__
 
-Deep Deterministic Policy Gradients (DDPG)
-------------------------------------------
+Deep Deterministic Policy Gradients (DDPG, TD3)
+-----------------------------------------------
 `[paper] <https://arxiv.org/abs/1509.02971>`__ `[implementation] <https://github.com/ray-project/ray/blob/master/python/ray/rllib/agents/ddpg/ddpg.py>`__
-DDPG is implemented similarly to DQN (below). The algorithm can be scaled by increasing the number of workers, switching to AsyncGradientsOptimizer, or using Ape-X.
+DDPG is implemented similarly to DQN (below). The algorithm can be scaled by increasing the number of workers, switching to AsyncGradientsOptimizer, or using Ape-X. The improvements from `TD3 <https://spinningup.openai.com/en/latest/algorithms/td3.html>`__ are available though not enabled by default.
 
-Tuned examples: `Pendulum-v0 <https://github.com/ray-project/ray/blob/master/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml>`__, `MountainCarContinuous-v0 <https://github.com/ray-project/ray/blob/master/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml>`__, `HalfCheetah-v2 <https://github.com/ray-project/ray/blob/master/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml>`__
+Tuned examples: `Pendulum-v0 <https://github.com/ray-project/ray/blob/master/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml>`__, `TD3 configuration <https://github.com/ray-project/ray/blob/master/python/ray/rllib/tuned_examples/pendulum-td3.yaml>`__, `MountainCarContinuous-v0 <https://github.com/ray-project/ray/blob/master/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml>`__, `HalfCheetah-v2 <https://github.com/ray-project/ray/blob/master/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml>`__
 
 **DDPG-specific configs** (see also `common configs <rllib-training.html#common-parameters>`__):
 

diff --git a/doc/source/rllib-env.rst b/doc/source/rllib-env.rst
@@ -15,7 +15,7 @@ PPO             **Yes**           **Yes**             **Yes**      **Yes**
 PG              **Yes**           **Yes**             **Yes**      **Yes**
 IMPALA          **Yes**           No                  **Yes**      **Yes**
 DQN, Rainbow    **Yes**           No                  **Yes**      No
-DDPG            No                **Yes**             **Yes**      No
+DDPG, TD3       No                **Yes**             **Yes**      No
 APEX-DQN        **Yes**           No                  **Yes**      No
 APEX-DDPG       No                **Yes**             **Yes**      No
 ES              **Yes**           **Yes**             No           No

diff --git a/doc/source/rllib.rst b/doc/source/rllib.rst
@@ -54,7 +54,7 @@ Algorithms
 
    -  `Advantage Actor-Critic (A2C, A3C) <rllib-algorithms.html#advantage-actor-critic-a2c-a3c>`__
 
-   -  `Deep Deterministic Policy Gradients (DDPG) <rllib-algorithms.html#deep-deterministic-policy-gradients-ddpg>`__
+   -  `Deep Deterministic Policy Gradients (DDPG, TD3) <rllib-algorithms.html#deep-deterministic-policy-gradients-ddpg-td3>`__
 
    -  `Deep Q Networks (DQN, Rainbow) <rllib-algorithms.html#deep-q-networks-dqn-rainbow>`__
 

diff --git a/python/ray/WebUI.ipynb b/python/ray/WebUI.ipynb
@@ -1,150 +1,97 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Ray UI\n",
-    "\n",
-    "Start the UI with **Kernel -> Restart and Run All**."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "import ray\n",
-    "import ray.experimental.ui as ui\n",
-    "\n",
-    "ray.init(redis_address=os.environ[\"REDIS_ADDRESS\"])"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "#### Object search."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "ui.object_search_bar()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "#### Task search."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "ui.task_search_bar()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "#### Task trace timeline."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "To view arrows, go to View Options and select Flow Events."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "ui.task_timeline()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "#### Task durations."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "ui.task_completion_time_distribution()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "#### CPU usage."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "ui.cpu_usage()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "#### Cluster usage."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "ui.cluster_usage()"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "Python 3",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.6.1"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+    "cells": [{
+        "cell_type": "markdown",
+        "metadata": {},
+        "source": [
+            "# Ray UI\n", "\n",
+            "Start the UI with **Kernel -> Restart and Run All**."
+        ]
+    }, {
+        "cell_type": "code",
+        "execution_count": null,
+        "metadata": {},
+        "outputs": [],
+        "source": [
+            "import os\n", "import ray\n",
+            "import ray.experimental.ui as ui\n", "\n",
+            "ray.init(redis_address=os.environ[\"REDIS_ADDRESS\"])"
+        ]
+    }, {
+        "cell_type": "markdown",
+        "metadata": {},
+        "source": ["#### Task trace timeline."]
+    }, {
+        "cell_type": "markdown",
+        "metadata": {},
+        "source": [
+            "To view arrows, go to View Options and select Flow Events."
+        ]
+    }, {
+        "cell_type": "code",
+        "execution_count": null,
+        "metadata": {},
+        "outputs": [],
+        "source": ["ui.task_timeline()"]
+    }, {
+        "cell_type": "markdown",
+        "metadata": {},
+        "source": ["#### Object transfer timeline."]
+    }, {
+        "cell_type": "code",
+        "execution_count": null,
+        "metadata": {},
+        "outputs": [],
+        "source": ["ui.object_transfer_timeline()"]
+    }, {
+        "cell_type": "markdown",
+        "metadata": {},
+        "source": ["#### Task durations."]
+    }, {
+        "cell_type": "code",
+        "execution_count": null,
+        "metadata": {},
+        "outputs": [],
+        "source": ["ui.task_completion_time_distribution()"]
+    }, {
+        "cell_type": "markdown",
+        "metadata": {},
+        "source": ["#### CPU usage."]
+    }, {
+        "cell_type": "code",
+        "execution_count": null,
+        "metadata": {},
+        "outputs": [],
+        "source": ["ui.cpu_usage()"]
+    }, {
+        "cell_type": "markdown",
+        "metadata": {},
+        "source": ["#### Cluster usage."]
+    }, {
+        "cell_type": "code",
+        "execution_count": null,
+        "metadata": {},
+        "outputs": [],
+        "source": ["ui.cluster_usage()"]
+    }],
+    "metadata": {
+        "kernelspec": {
+            "display_name": "Python 3",
+            "language": "python",
+            "name": "python3"
+        },
+        "language_info": {
+            "codemirror_mode": {
+                "name": "ipython",
+                "version": 3
+            },
+            "file_extension": ".py",
+            "mimetype": "text/x-python",
+            "name": "python",
+            "nbconvert_exporter": "python",
+            "pygments_lexer": "ipython3",
+            "version": "3.6.1"
+        }
+    },
+    "nbformat": 4,
+    "nbformat_minor": 2
 }
diff --git a/python/ray/autoscaler/autoscaler.py b/python/ray/autoscaler/autoscaler.py
@@ -491,8 +491,10 @@ def files_up_to_date(self, node_id):
     def recover_if_needed(self, node_id):
         if not self.can_update(node_id):
             return
-        last_heartbeat_time = self.load_metrics.last_heartbeat_time_by_ip.get(
-            self.provider.internal_ip(node_id), 0)
+        key = self.provider.internal_ip(node_id)
+        if key not in self.load_metrics.last_heartbeat_time_by_ip:
+            self.load_metrics.last_heartbeat_time_by_ip[key] = time.time()
+        last_heartbeat_time = self.load_metrics.last_heartbeat_time_by_ip[key]
         delta = time.time() - last_heartbeat_time
         if delta < AUTOSCALER_HEARTBEAT_TIMEOUT_S:
             return

diff --git a/python/ray/autoscaler/aws/config.py b/python/ray/autoscaler/aws/config.py
@@ -10,6 +10,7 @@
 
 import boto3
 from botocore.config import Config
+import botocore
 
 from ray.ray_constants import BOTO_MAX_RETRIES
 
@@ -272,7 +273,7 @@ def _get_role(role_name, config):
     try:
         role.load()
         return role
-    except Exception:
+    except botocore.errorfactory.NoSuchEntityException:
         return None
 
 
@@ -282,7 +283,7 @@ def _get_instance_profile(profile_name, config):
     try:
         profile.load()
         return profile
-    except Exception:
+    except botocore.errorfactory.NoSuchEntityException:
         return None