diff --git a/.clang-format b/.clang-format index c5ab0983b7530..5c0f059e15f3f 100644 --- a/.clang-format +++ b/.clang-format @@ -1,6 +1,5 @@ -BasedOnStyle: Chromium -ColumnLimit: 80 +BasedOnStyle: Google +ColumnLimit: 90 DerivePointerAlignment: false IndentCaseLabels: false PointerAlignment: Right -SpaceAfterCStyleCast: true diff --git a/.gitignore b/.gitignore index abd60923e6314..91189b6f9c41a 100644 --- a/.gitignore +++ b/.gitignore @@ -4,26 +4,17 @@ /python/build /python/dist /python/flatbuffers-1.7.1/ -/src/common/thirdparty/redis -/src/thirdparty/arrow /flatbuffers-1.7.1/ -/src/thirdparty/boost/ -/src/thirdparty/boost_1_65_1/ -/src/thirdparty/boost_1_60_0/ -/src/thirdparty/catapult/ -/src/thirdparty/flatbuffers/ -/src/thirdparty/parquet-cpp /thirdparty/pkg/ # Files generated by flatc should be ignored -/src/common/format/*.py -/src/common/format/*_generated.h -/src/plasma/format/ -/src/local_scheduler/format/*_generated.h /src/ray/gcs/format/*_generated.h /src/ray/object_manager/format/*_generated.h /src/ray/raylet/format/*_generated.h +# Modin source files +/python/ray/modin + # Redis temporary files *dump.rdb @@ -54,9 +45,6 @@ python/.eggs *.dylib *.dll -# Cython-generated files -*.c - # Incremental linking files *.ilk diff --git a/.travis.yml b/.travis.yml index 47bef360e51e5..795dff67b6108 100644 --- a/.travis.yml +++ b/.travis.yml @@ -53,8 +53,8 @@ matrix: - sphinx-build -W -b html -d _build/doctrees source _build/html - cd .. # Run Python linting, ignore dict vs {} (C408), others are defaults - - flake8 --exclude=python/ray/core/src/common/flatbuffers_ep-prefix/,python/ray/core/generated/,src/common/format/,doc/source/conf.py,python/ray/cloudpickle/ --ignore=C408,E121,E123,E126,E226,E24,E704,W503,W504 - - .travis/yapf.sh --all + - flake8 --exclude=python/ray/core/generated/,doc/source/conf.py,python/ray/cloudpickle/ --ignore=C408,E121,E123,E126,E226,E24,E704,W503,W504,W605 + - .travis/format.sh --all - os: linux dist: trusty @@ -69,16 +69,9 @@ matrix: script: - cd build - - bash ../src/common/test/run_valgrind.sh - - bash ../src/plasma/test/run_valgrind.sh - - bash ../src/local_scheduler/test/run_valgrind.sh - bash ../src/ray/test/run_object_manager_valgrind.sh - cd .. - - python ./python/ray/plasma/test/test.py valgrind - - python ./python/ray/local_scheduler/test/test.py valgrind - # - python ./python/ray/global_scheduler/test/test.py valgrind - # Build Linux wheels. - os: linux dist: trusty @@ -107,63 +100,6 @@ matrix: env: - PYTHON=3.5 - RAY_USE_NEW_GCS=on - - RAY_USE_XRAY=1 - - - os: linux - dist: trusty - env: PYTHON=3.5 RAY_USE_XRAY=1 - install: - - ./.travis/install-dependencies.sh - - export PATH="$HOME/miniconda/bin:$PATH" - - ./.travis/install-ray.sh - - ./.travis/install-cython-examples.sh - script: - - export PATH="$HOME/miniconda/bin:$PATH" - # The following is needed so cloudpickle can find some of the - # class definitions: The main module of tests that are run - # with pytest have the same name as the test file -- and this - # module is only found if the test directory is in the PYTHONPATH. 
- - export PYTHONPATH="$PYTHONPATH:./test/" - - - python -m pytest -v python/ray/common/test/test.py - - python -m pytest -v python/ray/common/redis_module/runtest.py - - python -m pytest -v python/ray/plasma/test/test.py - # - python -m pytest -v python/ray/local_scheduler/test/test.py - # - python -m pytest -v python/ray/global_scheduler/test/test.py - - - python -m pytest -v python/ray/test/test_global_state.py - - python -m pytest -v python/ray/test/test_queue.py - - python -m pytest -v test/xray_test.py - - - python -m pytest -v test/runtest.py - - python -m pytest -v test/array_test.py - - python -m pytest -v test/actor_test.py - - python -m pytest -v test/autoscaler_test.py - - python -m pytest -v test/tensorflow_test.py - - python -m pytest -v test/failure_test.py - - python -m pytest -v test/microbenchmarks.py - - python -m pytest -v test/stress_tests.py - - pytest test/component_failures_test.py - - python test/multi_node_test.py - - python -m pytest -v test/recursion_test.py - - pytest test/monitor_test.py - - python -m pytest -v test/cython_test.py - - python -m pytest -v test/credis_test.py - - # ray tune tests - - python python/ray/tune/test/dependency_test.py - - python -m pytest -v python/ray/tune/test/trial_runner_test.py - - python -m pytest -v python/ray/tune/test/trial_scheduler_test.py - - python -m pytest -v python/ray/tune/test/experiment_test.py - - python -m pytest -v python/ray/tune/test/tune_server_test.py - - python -m pytest -v python/ray/tune/test/ray_trial_executor_test.py - - python -m pytest -v python/ray/tune/test/automl_searcher_test.py - - # ray rllib tests - - python -m pytest -v python/ray/rllib/test/test_catalog.py - - python -m pytest -v python/ray/rllib/test/test_filters.py - - python -m pytest -v python/ray/rllib/test/test_optimizers.py - - python -m pytest -v python/ray/rllib/test/test_evaluators.py install: @@ -181,12 +117,10 @@ install: - ./src/ray/raylet/lineage_cache_test - ./src/ray/raylet/task_dependency_manager_test - ./src/ray/raylet/reconstruction_policy_test + - ./src/ray/raylet/client_connection_test - ./src/ray/util/logging_test --gtest_filter=PrintLogTest* - ./src/ray/util/signal_test - - bash ../src/common/test/run_tests.sh - - bash ../src/plasma/test/run_tests.sh - - bash ../src/local_scheduler/test/run_tests.sh - cd .. script: @@ -197,14 +131,27 @@ script: # module is only found if the test directory is in the PYTHONPATH. - export PYTHONPATH="$PYTHONPATH:./test/" - - python -m pytest -v python/ray/common/test/test.py - - python -m pytest -v python/ray/common/redis_module/runtest.py - - python -m pytest -v python/ray/plasma/test/test.py - - python -m pytest -v python/ray/local_scheduler/test/test.py - - python -m pytest -v python/ray/global_scheduler/test/test.py + # ray tune tests + - python python/ray/tune/test/dependency_test.py + - python -m pytest -v python/ray/tune/test/trial_runner_test.py + - python -m pytest -v python/ray/tune/test/trial_scheduler_test.py + - python -m pytest -v python/ray/tune/test/experiment_test.py + - python -m pytest -v python/ray/tune/test/tune_server_test.py + - python -m pytest -v python/ray/tune/test/ray_trial_executor_test.py + - python -m pytest -v python/ray/tune/test/automl_searcher_test.py + + # ray rllib tests + - python -m pytest -v python/ray/rllib/test/test_catalog.py + - python -m pytest -v python/ray/rllib/test/test_filters.py + - python -m pytest -v python/ray/rllib/test/test_optimizers.py + - python -m pytest -v python/ray/rllib/test/test_evaluators.py + + # Python3.5+ only. 
Otherwise we will get `SyntaxError` regardless of how we set the tester. + - python -c 'import sys;exit(sys.version_info>=(3,5))' || python -m pytest -v python/ray/experimental/test/async_test.py - python -m pytest -v python/ray/test/test_global_state.py - python -m pytest -v python/ray/test/test_queue.py + - python -m pytest -v python/ray/test/test_ray_init.py - python -m pytest -v test/xray_test.py - python -m pytest -v test/runtest.py @@ -216,26 +163,19 @@ script: - python -m pytest -v test/microbenchmarks.py - python -m pytest -v test/stress_tests.py - python -m pytest -v test/component_failures_test.py - - python test/multi_node_test.py + - python -m pytest -v test/multi_node_test.py + - python -m pytest -v test/multi_node_test_2.py - python -m pytest -v test/recursion_test.py - python -m pytest -v test/monitor_test.py - python -m pytest -v test/cython_test.py - python -m pytest -v test/credis_test.py + - python -m pytest -v test/node_manager_test.py - # ray tune tests - - python python/ray/tune/test/dependency_test.py - - python -m pytest -v python/ray/tune/test/trial_runner_test.py - - python -m pytest -v python/ray/tune/test/trial_scheduler_test.py - - python -m pytest -v python/ray/tune/test/experiment_test.py - - python -m pytest -v python/ray/tune/test/tune_server_test.py - - python -m pytest -v python/ray/tune/test/ray_trial_executor_test.py - - python -m pytest -v python/ray/tune/test/automl_searcher_test.py + # ray temp file tests + - python -m pytest -v test/tempfile_test.py - # ray rllib tests - - python -m pytest -v python/ray/rllib/test/test_catalog.py - - python -m pytest -v python/ray/rllib/test/test_filters.py - - python -m pytest -v python/ray/rllib/test/test_optimizers.py - - python -m pytest -v python/ray/rllib/test/test_evaluators.py + # modin test files + - python python/ray/test/test_modin.py deploy: - provider: s3 diff --git a/.travis/yapf.sh b/.travis/format.sh similarity index 74% rename from .travis/yapf.sh rename to .travis/format.sh index d90aec89531d2..9313e641065a8 100755 --- a/.travis/yapf.sh +++ b/.travis/format.sh @@ -1,4 +1,6 @@ #!/usr/bin/env bash +# YAPF + Clang formatter (if installed). This script formats all changed files from the last mergebase. +# You are encouraged to run this locally before pushing changes for review. # Cause the script to exit if a single command fails set -eo pipefail @@ -28,7 +30,6 @@ YAPF_EXCLUDES=( '--exclude' 'python/build/*' '--exclude' 'python/ray/pyarrow_files/*' '--exclude' 'python/ray/core/src/ray/gcs/*' - '--exclude' 'python/ray/common/thirdparty/*' ) # Format specified files @@ -50,6 +51,18 @@ format_changed() { if ! git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.py' &>/dev/null; then git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' | xargs -P 5 \ yapf --in-place "${YAPF_EXCLUDES[@]}" "${YAPF_FLAGS[@]}" + if which flake8 >/dev/null; then + git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' | xargs -P 5 \ + flake8 --exclude=python/ray/core/generated/,doc/source/conf.py,python/ray/cloudpickle/ \ + --ignore=C408,E121,E123,E126,E226,E24,E704,W503,W504,W605 + fi + fi + + if which clang-format >/dev/null; then + if ! 
git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.cc' '*.h' &>/dev/null; then + git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.cc' '*.h' | xargs -P 5 \ + clang-format -i + fi fi } diff --git a/.travis/install-dependencies.sh b/.travis/install-dependencies.sh index 1c6c3a342a616..5bae4ba87f8db 100755 --- a/.travis/install-dependencies.sh +++ b/.travis/install-dependencies.sh @@ -24,8 +24,8 @@ if [[ "$PYTHON" == "2.7" ]] && [[ "$platform" == "linux" ]]; then wget https://repo.continuum.io/miniconda/Miniconda2-4.5.4-Linux-x86_64.sh -O miniconda.sh -nv bash miniconda.sh -b -p $HOME/miniconda export PATH="$HOME/miniconda/bin:$PATH" - pip install -q cython==0.27.3 cmake tensorflow gym opencv-python pyyaml pandas==0.22 requests \ - feather-format lxml openpyxl xlrd + pip install -q cython==0.27.3 cmake tensorflow gym opencv-python pyyaml pandas==0.23.4 requests \ + feather-format lxml openpyxl xlrd py-spy setproctitle faulthandler pytest-timeout mock elif [[ "$PYTHON" == "3.5" ]] && [[ "$platform" == "linux" ]]; then sudo apt-get update sudo apt-get install -y cmake pkg-config python-dev python-numpy build-essential autoconf curl libtool unzip @@ -33,8 +33,8 @@ elif [[ "$PYTHON" == "3.5" ]] && [[ "$platform" == "linux" ]]; then wget https://repo.continuum.io/miniconda/Miniconda3-4.5.4-Linux-x86_64.sh -O miniconda.sh -nv bash miniconda.sh -b -p $HOME/miniconda export PATH="$HOME/miniconda/bin:$PATH" - pip install -q cython==0.27.3 cmake tensorflow gym opencv-python pyyaml pandas==0.22 requests \ - feather-format lxml openpyxl xlrd + pip install -q cython==0.27.3 cmake tensorflow gym opencv-python pyyaml pandas==0.23.4 requests \ + feather-format lxml openpyxl xlrd py-spy setproctitle pytest-timeout elif [[ "$PYTHON" == "2.7" ]] && [[ "$platform" == "macosx" ]]; then # check that brew is installed which -s brew @@ -50,8 +50,8 @@ elif [[ "$PYTHON" == "2.7" ]] && [[ "$platform" == "macosx" ]]; then wget https://repo.continuum.io/miniconda/Miniconda2-4.5.4-MacOSX-x86_64.sh -O miniconda.sh -nv bash miniconda.sh -b -p $HOME/miniconda export PATH="$HOME/miniconda/bin:$PATH" - pip install -q cython==0.27.3 cmake tensorflow gym opencv-python pyyaml pandas==0.22 requests \ - feather-format lxml openpyxl xlrd + pip install -q cython==0.27.3 cmake tensorflow gym opencv-python pyyaml pandas==0.23.4 requests \ + feather-format lxml openpyxl xlrd py-spy setproctitle faulthandler pytest-timeout mock elif [[ "$PYTHON" == "3.5" ]] && [[ "$platform" == "macosx" ]]; then # check that brew is installed which -s brew @@ -67,8 +67,8 @@ elif [[ "$PYTHON" == "3.5" ]] && [[ "$platform" == "macosx" ]]; then wget https://repo.continuum.io/miniconda/Miniconda3-4.5.4-MacOSX-x86_64.sh -O miniconda.sh -nv bash miniconda.sh -b -p $HOME/miniconda export PATH="$HOME/miniconda/bin:$PATH" - pip install -q cython==0.27.3 cmake tensorflow gym opencv-python pyyaml pandas==0.22 requests \ - feather-format lxml openpyxl xlrd + pip install -q cython==0.27.3 cmake tensorflow gym opencv-python pyyaml pandas==0.23.4 requests \ + feather-format lxml openpyxl xlrd py-spy setproctitle pytest-timeout elif [[ "$LINT" == "1" ]]; then sudo apt-get update sudo apt-get install -y cmake build-essential autoconf curl libtool unzip diff --git a/.travis/test-wheels.sh b/.travis/test-wheels.sh index 1b77209c3ddc7..f7870ea52d496 100755 --- a/.travis/test-wheels.sh +++ b/.travis/test-wheels.sh @@ -56,10 +56,10 @@ if [[ "$platform" == "linux" ]]; then # Check that the other wheels are present. 
NUMBER_OF_WHEELS=$(ls -1q $ROOT_DIR/../.whl/*.whl | wc -l) - if [[ "$NUMBER_OF_WHEELS" != "4" ]]; then + if [[ "$NUMBER_OF_WHEELS" != "5" ]]; then echo "Wrong number of wheels found." ls -l $ROOT_DIR/../.whl/ - exit 1 + exit 2 fi elif [[ "$platform" == "macosx" ]]; then @@ -67,12 +67,14 @@ elif [[ "$platform" == "macosx" ]]; then PY_MMS=("2.7" "3.4" "3.5" - "3.6") + "3.6" + "3.7") # This array is just used to find the right wheel. PY_WHEEL_VERSIONS=("27" "34" "35" - "36") + "36" + "37") for ((i=0; i<${#PY_MMS[@]}; ++i)); do PY_MM=${PY_MMS[i]} @@ -92,5 +94,5 @@ elif [[ "$platform" == "macosx" ]]; then done else echo "Unrecognized environment." - exit 1 + exit 3 fi diff --git a/CMakeLists.txt b/CMakeLists.txt index d02e88a5c4203..a6734e62ce144 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -82,18 +82,15 @@ include_directories(SYSTEM ${PLASMA_INCLUDE_DIR}) include_directories("${CMAKE_CURRENT_LIST_DIR}/src/") add_subdirectory(${CMAKE_CURRENT_LIST_DIR}/src/ray/) -add_subdirectory(${CMAKE_CURRENT_LIST_DIR}/src/common/) -add_subdirectory(${CMAKE_CURRENT_LIST_DIR}/src/plasma/) -add_subdirectory(${CMAKE_CURRENT_LIST_DIR}/src/local_scheduler/) -add_subdirectory(${CMAKE_CURRENT_LIST_DIR}/src/global_scheduler/) # final target copy_ray add_custom_target(copy_ray ALL) # copy plasma_store_server add_custom_command(TARGET copy_ray POST_BUILD + COMMAND mkdir -p ${CMAKE_CURRENT_BINARY_DIR}/src/plasma COMMAND ${CMAKE_COMMAND} -E - copy ${ARROW_HOME}/bin/plasma_store_server ${CMAKE_CURRENT_BINARY_DIR}/src/plasma) + copy ${ARROW_HOME}/bin/plasma_store_server ${CMAKE_CURRENT_BINARY_DIR}/src/plasma/) if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") # add pyarrow as the dependency @@ -102,12 +99,9 @@ if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") # NOTE: The lists below must be kept in sync with ray/python/setup.py. set(ray_file_list - "src/common/thirdparty/redis/src/redis-server" - "src/common/redis_module/libray_redis_module.so" - "src/plasma/plasma_manager" - "src/local_scheduler/local_scheduler" - "src/local_scheduler/liblocal_scheduler_library_python.so" - "src/global_scheduler/global_scheduler" + "src/ray/thirdparty/redis/src/redis-server" + "src/ray/gcs/redis_module/libray_redis_module.so" + "src/ray/raylet/liblocal_scheduler_library_python.so" "src/ray/raylet/raylet_monitor" "src/ray/raylet/raylet") @@ -117,7 +111,10 @@ if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") list(APPEND ray_file_list "src/credis/redis/src/redis-server") endif() - if (DEFINED ENV{INCLUDE_UI} AND "$ENV{INCLUDE_UI}" STREQUAL "1") + # The goal of the if statement below is to require the catapult files to be + # present INCLUDE_UI=1 is set and to include the UI files if they are present. + # This should match the logic in build_ui.sh. + if (EXISTS "${CMAKE_BINARY_DIR}/src/catapult_files/index.html" OR "$ENV{INCLUDE_UI}" STREQUAL "1") list(APPEND ray_file_list "src/catapult_files/index.html") list(APPEND ray_file_list "src/catapult_files/trace_viewer_full.html") endif() @@ -154,5 +151,6 @@ if ("${CMAKE_RAY_LANG_JAVA}" STREQUAL "YES") # copy libplasma_java files add_custom_command(TARGET copy_ray POST_BUILD - COMMAND bash -c "cp ${ARROW_LIBRARY_DIR}/libplasma_java.* ${CMAKE_CURRENT_BINARY_DIR}/src/plasma") + COMMAND bash -c "mkdir -p ${CMAKE_CURRENT_BINARY_DIR}/src/plasma" + COMMAND bash -c "cp ${ARROW_LIBRARY_DIR}/libplasma_java.* ${CMAKE_CURRENT_BINARY_DIR}/src/plasma/") endif() diff --git a/README.rst b/README.rst index 356ef60ebf6f9..5fd892f95f037 100644 --- a/README.rst +++ b/README.rst @@ -1,5 +1,6 @@ -Ray -=== +.. 
raw:: html + + .. image:: https://travis-ci.com/ray-project/ray.svg?branch=master :target: https://travis-ci.com/ray-project/ray @@ -7,9 +8,12 @@ Ray .. image:: https://readthedocs.org/projects/ray/badge/?version=latest :target: http://ray.readthedocs.io/en/latest/?badge=latest +.. image:: https://img.shields.io/badge/pypi-0.6.0-blue.svg + :target: https://pypi.org/project/ray/ + | -Ray is a flexible, high-performance distributed execution framework. +**Ray is a flexible, high-performance distributed execution framework.** Ray is easy to install: ``pip install ray`` @@ -37,11 +41,12 @@ Example Use Ray comes with libraries that accelerate deep learning and reinforcement learning development: -- `Ray Tune`_: Hyperparameter Optimization Framework -- `Ray RLlib`_: Scalable Reinforcement Learning +- `Tune`_: Hyperparameter Optimization Framework +- `RLlib`_: Scalable Reinforcement Learning +- `Distributed Training `__ -.. _`Ray Tune`: http://ray.readthedocs.io/en/latest/tune.html -.. _`Ray RLlib`: http://ray.readthedocs.io/en/latest/rllib.html +.. _`Tune`: http://ray.readthedocs.io/en/latest/tune.html +.. _`RLlib`: http://ray.readthedocs.io/en/latest/rllib.html Installation ------------ diff --git a/build.sh b/build.sh index 496bbdddb5750..6aa695b83a924 100755 --- a/build.sh +++ b/build.sh @@ -25,7 +25,7 @@ function usage() # Determine how many parallel jobs to use for make based on the number of cores unamestr="$(uname)" if [[ "$unamestr" == "Linux" ]]; then - PARALLEL=$(nproc) + PARALLEL=$(nproc --all) elif [[ "$unamestr" == "Darwin" ]]; then PARALLEL=$(sysctl -n hw.ncpu) else @@ -101,12 +101,16 @@ fi pushd "$BUILD_DIR" +# avoid the command failed and exits +# and cmake will check some directories to determine whether some targets built +make clean || true +rm -rf external/arrow-install + cmake -DCMAKE_BUILD_TYPE=$CBUILD_TYPE \ -DCMAKE_RAY_LANG_JAVA=$RAY_BUILD_JAVA \ -DCMAKE_RAY_LANG_PYTHON=$RAY_BUILD_PYTHON \ -DRAY_USE_NEW_GCS=$RAY_USE_NEW_GCS \ -DPYTHON_EXECUTABLE:FILEPATH=$PYTHON_EXECUTABLE $ROOT_DIR -make clean make -j${PARALLEL} popd diff --git a/cmake/Modules/ArrowExternalProject.cmake b/cmake/Modules/ArrowExternalProject.cmake index dfb25f244f9a2..3e19dfbd2672f 100644 --- a/cmake/Modules/ArrowExternalProject.cmake +++ b/cmake/Modules/ArrowExternalProject.cmake @@ -9,25 +9,21 @@ # - ARROW_INCLUDE_DIR # - ARROW_SHARED_LIB # - ARROW_STATIC_LIB +# - ARROW_LIBRARY_DIR # - PLASMA_INCLUDE_DIR # - PLASMA_STATIC_LIB # - PLASMA_SHARED_LIB set(arrow_URL https://github.com/apache/arrow.git) -# The PR for this commit is https://github.com/apache/arrow/pull/2522. We +# The PR for this commit is https://github.com/apache/arrow/pull/3093. We # include the link here to make it easier to find the right commit because # Arrow often rewrites git history and invalidates certain commits. 
-set(arrow_TAG 7104d64ff2cd6c20e29d3cf4ec5c58bc10798f66) +set(arrow_TAG 187b98ed338d4995317dae9efd19870c532192cb) set(ARROW_INSTALL_PREFIX ${CMAKE_CURRENT_BINARY_DIR}/external/arrow-install) set(ARROW_HOME ${ARROW_INSTALL_PREFIX}) set(ARROW_SOURCE_DIR ${CMAKE_CURRENT_BINARY_DIR}/external/arrow/src/arrow_ep) -# The following is needed because in CentOS, the lib directory is named lib64 -if(EXISTS "/etc/redhat-release" AND CMAKE_SIZEOF_VOID_P EQUAL 8) - set(LIB_SUFFIX 64) -endif() - set(ARROW_INCLUDE_DIR ${ARROW_HOME}/include) set(ARROW_LIBRARY_DIR ${ARROW_HOME}/lib${LIB_SUFFIX}) set(ARROW_SHARED_LIB ${ARROW_LIBRARY_DIR}/libarrow${CMAKE_SHARED_LIBRARY_SUFFIX}) @@ -58,7 +54,8 @@ set(ARROW_CMAKE_ARGS -DARROW_WITH_LZ4=off -DARROW_WITH_ZSTD=off -DFLATBUFFERS_HOME=${FLATBUFFERS_HOME} - -DBOOST_ROOT=${BOOST_ROOT}) + -DBOOST_ROOT=${BOOST_ROOT} + -DGLOG_HOME=${GLOG_HOME}) if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") # PyArrow needs following settings. @@ -92,19 +89,24 @@ endif() ExternalProject_Add(arrow_ep PREFIX external/arrow - DEPENDS flatbuffers boost + DEPENDS flatbuffers boost glog GIT_REPOSITORY ${arrow_URL} GIT_TAG ${arrow_TAG} + UPDATE_COMMAND "" ${ARROW_CONFIGURE} BUILD_BYPRODUCTS "${ARROW_SHARED_LIB}" "${ARROW_STATIC_LIB}") if ("${CMAKE_RAY_LANG_JAVA}" STREQUAL "YES") - ExternalProject_Add_Step(arrow_ep arrow_ep_install_java_lib - COMMAND bash -c "cd ${ARROW_SOURCE_DIR}/java && mvn clean install -pl plasma -am -Dmaven.test.skip > /dev/null" - DEPENDEES build) + set_property(DIRECTORY APPEND PROPERTY ADDITIONAL_MAKE_CLEAN_FILES "${ARROW_SOURCE_DIR}/java/target/") + + if(NOT EXISTS ${ARROW_SOURCE_DIR}/java/target/) + ExternalProject_Add_Step(arrow_ep arrow_ep_install_java_lib + COMMAND bash -c "cd ${ARROW_SOURCE_DIR}/java && mvn clean install -pl plasma -am -Dmaven.test.skip > /dev/null" + DEPENDEES build) + endif() # add install of library plasma_java, it is not configured in plasma CMakeLists.txt ExternalProject_Add_Step(arrow_ep arrow_ep_install_plasma_java - COMMAND bash -c "cp ${CMAKE_CURRENT_BINARY_DIR}/external/arrow/src/arrow_ep-build/release/libplasma_java.* ${ARROW_LIBRARY_DIR}/" + COMMAND bash -c "cp -rf ${CMAKE_CURRENT_BINARY_DIR}/external/arrow/src/arrow_ep-build/release/libplasma_java.* ${ARROW_LIBRARY_DIR}/" DEPENDEES install) endif () diff --git a/cmake/Modules/BoostExternalProject.cmake b/cmake/Modules/BoostExternalProject.cmake index bab016a02b7a3..1fbbb0c0b58ef 100644 --- a/cmake/Modules/BoostExternalProject.cmake +++ b/cmake/Modules/BoostExternalProject.cmake @@ -9,9 +9,9 @@ # boost is a stable library in ray, and it supports to find # the boost pre-built in environment to speed up build process -if (DEFINED ENV{BOOST_ROOT} AND EXISTS ENV{BOOST_ROOT}) +if (DEFINED ENV{RAY_BOOST_ROOT} AND EXISTS $ENV{RAY_BOOST_ROOT}) set(Boost_USE_STATIC_LIBS ON) - set(BOOST_ROOT "$ENV{BOOST_ROOT}") + set(BOOST_ROOT "$ENV{RAY_BOOST_ROOT}") message(STATUS "Find BOOST_ROOT: ${BOOST_ROOT}") # find_package(Boost COMPONENTS system filesystem REQUIRED) set(Boost_INCLUDE_DIR ${BOOST_ROOT}/include) diff --git a/cmake/Modules/Common.cmake b/cmake/Modules/Common.cmake index cc2a5d5ff9926..7d33f13e9d450 100644 --- a/cmake/Modules/Common.cmake +++ b/cmake/Modules/Common.cmake @@ -41,6 +41,3 @@ if ("${CMAKE_RAY_LANG_JAVA}" STREQUAL "YES") message (WARNING "NOT FIND JNI") endif() endif() - -include_directories(${CMAKE_SOURCE_DIR}/src/common) -include_directories(${CMAKE_SOURCE_DIR}/src/common/thirdparty) diff --git a/cmake/Modules/FlatBuffersExternalProject.cmake 
b/cmake/Modules/FlatBuffersExternalProject.cmake index 57c2216cecfb7..508010afced49 100644 --- a/cmake/Modules/FlatBuffersExternalProject.cmake +++ b/cmake/Modules/FlatBuffersExternalProject.cmake @@ -10,13 +10,8 @@ # - FLATBUFFERS_COMPILER # - FBS_DEPENDS, to keep compatible -# The following is needed because in CentOS, the lib directory is named lib64 -if(EXISTS "/etc/redhat-release" AND CMAKE_SIZEOF_VOID_P EQUAL 8) - set(LIB_SUFFIX 64) -endif() - -if(DEFINED ENV{FLATBUFFERS_HOME} AND EXISTS ENV{FLATBUFFERS_HOME}) - set(FLATBUFFERS_HOME "$ENV{FLATBUFFERS_HOME}") +if(DEFINED ENV{RAY_FLATBUFFERS_HOME} AND EXISTS $ENV{RAY_FLATBUFFERS_HOME}) + set(FLATBUFFERS_HOME "$ENV{RAY_FLATBUFFERS_HOME}") set(FLATBUFFERS_INCLUDE_DIR "${FLATBUFFERS_HOME}/include") set(FLATBUFFERS_STATIC_LIB "${FLATBUFFERS_HOME}/lib${LIB_SUFFIX}/libflatbuffers.a") set(FLATBUFFERS_COMPILER "${FLATBUFFERS_HOME}/bin/flatc") diff --git a/cmake/Modules/GlogExternalProject.cmake b/cmake/Modules/GlogExternalProject.cmake index 47f11fbdbd6ad..2900bae4d523b 100644 --- a/cmake/Modules/GlogExternalProject.cmake +++ b/cmake/Modules/GlogExternalProject.cmake @@ -6,8 +6,8 @@ # - GLOG_INCLUDE_DIR # - GLOG_STATIC_LIB -if(DEFINED ENV{GLOG_HOME} AND EXISTS ENV{GLOG_HOME}) - set(GLOG_HOME "$ENV{GLOG_HOME}") +if(DEFINED ENV{RAY_GLOG_HOME} AND EXISTS $ENV{RAY_GLOG_HOME}) + set(GLOG_HOME "$ENV{RAY_GLOG_HOME}") set(GLOG_INCLUDE_DIR "${GLOG_HOME}/include") set(GLOG_STATIC_LIB "${GLOG_HOME}/lib/libglog.a") @@ -23,7 +23,7 @@ else() endif() set(GLOG_URL "https://github.com/google/glog/archive/v${GLOG_VERSION}.tar.gz") - set(GLOG_PREFIX "${CMAKE_CURRENT_BINARY_DIR}/external/glog/src/glog_ep") + set(GLOG_PREFIX "${CMAKE_CURRENT_BINARY_DIR}/external/glog-install") set(GLOG_HOME "${GLOG_PREFIX}") set(GLOG_INCLUDE_DIR "${GLOG_PREFIX}/include") set(GLOG_STATIC_LIB "${GLOG_PREFIX}/lib/libglog.a") diff --git a/cmake/Modules/GtestExternalProject.cmake b/cmake/Modules/GtestExternalProject.cmake index 5570066c60fbb..66e5a76f1d87e 100644 --- a/cmake/Modules/GtestExternalProject.cmake +++ b/cmake/Modules/GtestExternalProject.cmake @@ -7,18 +7,31 @@ # - GTEST_MAIN_STATIC_LIB # - GMOCK_MAIN_STATIC_LIB -if(DEFINED ENV{GTEST_HOME} AND EXISTS ENV{GTEST_HOME}) - set(GTEST_HOME "$ENV{GTEST_HOME}") - set(GTEST_INCLUDE_DIR "${GTEST_HOME}/include") - set(GTEST_STATIC_LIB - "${GTEST_HOME}/lib/${CMAKE_STATIC_LIBRARY_PREFIX}gtest${CMAKE_STATIC_LIBRARY_SUFFIX}") - set(GTEST_MAIN_STATIC_LIB - "${GTEST_HOME}/lib/${CMAKE_STATIC_LIBRARY_PREFIX}gtest_main${CMAKE_STATIC_LIBRARY_SUFFIX}") - set(GMOCK_MAIN_STATIC_LIB - "${GTEST_HOME}/lib/${CMAKE_STATIC_LIBRARY_PREFIX}gmock_main${CMAKE_STATIC_LIBRARY_SUFFIX}") +set(GTEST_FOUND FALSE) + +if(DEFINED ENV{RAY_GTEST_HOME} AND EXISTS $ENV{RAY_GTEST_HOME}) + set(GTEST_HOME "$ENV{RAY_GTEST_HOME}") + find_path(GTEST_INCLUDE_DIR NAMES gtest/gtest.h + PATHS ${GTEST_HOME} NO_DEFAULT_PATH + PATH_SUFFIXES "include") + find_library(GTEST_LIBRARIES NAMES gtest gtest_main gmock_main + PATHS ${GTEST_HOME} NO_DEFAULT_PATH + PATH_SUFFIXES "lib") + if(GTEST_INCLUDE_DIR AND GTEST_LIBRARIES) + set(GTEST_FOUND TRUE) + set(GTEST_STATIC_LIB + "${GTEST_HOME}/lib/${CMAKE_STATIC_LIBRARY_PREFIX}gtest${CMAKE_STATIC_LIBRARY_SUFFIX}") + set(GTEST_MAIN_STATIC_LIB + "${GTEST_HOME}/lib/${CMAKE_STATIC_LIBRARY_PREFIX}gtest_main${CMAKE_STATIC_LIBRARY_SUFFIX}") + set(GMOCK_MAIN_STATIC_LIB + "${GTEST_HOME}/lib/${CMAKE_STATIC_LIBRARY_PREFIX}gmock_main${CMAKE_STATIC_LIBRARY_SUFFIX}") + + add_custom_target(googletest_ep) + endif() + +endif() - add_custom_target(googletest_ep) 
-else() +if(NOT GTEST_FOUND) set(GTEST_VERSION "1.8.0") if(APPLE) @@ -31,7 +44,7 @@ else() endif() set(GTEST_CMAKE_CXX_FLAGS "${EP_CXX_FLAGS} ${CMAKE_CXX_FLAGS_${UPPERCASE_BUILD_TYPE}} ${GTEST_CMAKE_CXX_FLAGS}") - set(GTEST_PREFIX "${CMAKE_CURRENT_BINARY_DIR}/external/googletest/src/googletest_ep") + set(GTEST_PREFIX "${CMAKE_CURRENT_BINARY_DIR}/external/googletest-install") set(GTEST_INCLUDE_DIR "${GTEST_PREFIX}/include") set(GTEST_STATIC_LIB "${GTEST_PREFIX}/lib/${CMAKE_STATIC_LIBRARY_PREFIX}gtest${CMAKE_STATIC_LIBRARY_SUFFIX}") diff --git a/cmake/Modules/ThirdpartyToolchain.cmake b/cmake/Modules/ThirdpartyToolchain.cmake index 0e0553483ec23..723b3cd6aa001 100644 --- a/cmake/Modules/ThirdpartyToolchain.cmake +++ b/cmake/Modules/ThirdpartyToolchain.cmake @@ -4,6 +4,11 @@ # we have to turn it on for dependencies too set(EP_CXX_FLAGS "${EP_CXX_FLAGS} -D_GLIBCXX_USE_CXX11_ABI=0") +# The following is needed because in CentOS, the lib directory is named lib64 +if(EXISTS "/etc/redhat-release" AND CMAKE_SIZEOF_VOID_P EQUAL 8) + set(LIB_SUFFIX 64) +endif() + if(RAY_BUILD_TESTS OR RAY_BUILD_BENCHMARKS) add_custom_target(unittest ctest -L unittest) @@ -25,18 +30,16 @@ if(RAY_BUILD_TESTS OR RAY_BUILD_BENCHMARKS) add_dependencies(gmock_main googletest_ep) endif() -if(RAY_USE_GLOG) - include(GlogExternalProject) - message(STATUS "Glog home: ${GLOG_HOME}") - message(STATUS "Glog include dir: ${GLOG_INCLUDE_DIR}") - message(STATUS "Glog static lib: ${GLOG_STATIC_LIB}") +include(GlogExternalProject) +message(STATUS "Glog home: ${GLOG_HOME}") +message(STATUS "Glog include dir: ${GLOG_INCLUDE_DIR}") +message(STATUS "Glog static lib: ${GLOG_STATIC_LIB}") - include_directories(${GLOG_INCLUDE_DIR}) - ADD_THIRDPARTY_LIB(glog - STATIC_LIB ${GLOG_STATIC_LIB}) +include_directories(${GLOG_INCLUDE_DIR}) +ADD_THIRDPARTY_LIB(glog + STATIC_LIB ${GLOG_STATIC_LIB}) - add_dependencies(glog glog_ep) -endif() +add_dependencies(glog glog_ep) # boost include(BoostExternalProject) @@ -95,19 +98,6 @@ ADD_THIRDPARTY_LIB(plasma STATIC_LIB ${PLASMA_STATIC_LIB}) add_dependencies(plasma plasma_ep) if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") - # pyarrow - find_package(PythonInterp REQUIRED) - message(STATUS "PYTHON_EXECUTABLE for pyarrow: ${PYTHON_EXECUTABLE}") - - set(pyarrow_ENV - "PKG_CONFIG_PATH=${ARROW_LIBRARY_DIR}/pkgconfig" - "PYARROW_WITH_PLASMA=1" - "PYARROW_WITH_TENSORFLOW=1" - "PYARROW_BUNDLE_ARROW_CPP=1" - "PARQUET_HOME=${PARQUET_HOME}" - "PYARROW_WITH_PARQUET=1" - ) - # clean the arrow_ep/python/build/lib.xxxxx directory, # or when you build with another python version, it creates multiple lib.xxxx directories set_property(DIRECTORY APPEND PROPERTY ADDITIONAL_MAKE_CLEAN_FILES "${ARROW_SOURCE_DIR}/python/build/") @@ -115,13 +105,40 @@ if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") # here we use externalProject to process pyarrow building # add_custom_command would have problem with setup.py - ExternalProject_Add(pyarrow_ext - PREFIX external/pyarrow - DEPENDS arrow_ep - DOWNLOAD_COMMAND "" - BUILD_IN_SOURCE 1 - CONFIGURE_COMMAND cd ${ARROW_SOURCE_DIR}/python && ${CMAKE_COMMAND} -E env ${pyarrow_ENV} ${PYTHON_EXECUTABLE} setup.py build - BUILD_COMMAND cd ${ARROW_SOURCE_DIR}/python && ${CMAKE_COMMAND} -E env ${pyarrow_ENV} ${PYTHON_EXECUTABLE} setup.py build_ext - INSTALL_COMMAND bash -c "cp -rf \$(find ${ARROW_SOURCE_DIR}/python/build/ -maxdepth 1 -type d -print | grep -m1 'lib')/pyarrow ${CMAKE_SOURCE_DIR}/python/ray/pyarrow_files/") + if(EXISTS ${ARROW_SOURCE_DIR}/python/build/) + # if we did not run `make clean`, 
skip the rebuild of pyarrow + add_custom_target(pyarrow_ext) + else() + # pyarrow + find_package(PythonInterp REQUIRED) + message(STATUS "PYTHON_EXECUTABLE for pyarrow: ${PYTHON_EXECUTABLE}") + + # PYARROW_PARALLEL= , so it will add -j to pyarrow build + set(pyarrow_ENV + "PKG_CONFIG_PATH=${ARROW_LIBRARY_DIR}/pkgconfig" + "PYARROW_WITH_PLASMA=1" + "PYARROW_WITH_TENSORFLOW=1" + "PYARROW_BUNDLE_ARROW_CPP=1" + "PARQUET_HOME=${PARQUET_HOME}" + "PYARROW_WITH_PARQUET=1" + "PYARROW_PARALLEL=") + + if (APPLE) + # Since 10.14, the XCode toolchain only accepts libc++ as the + # standard library. This should also work on macOS starting from 10.9. + set(pyarrow_ENV ${pyarrow_ENV} "CXXFLAGS='-stdlib=libc++'") + set(pyarrow_ENV ${pyarrow_ENV} "MACOSX_DEPLOYMENT_TARGET=10.7") + endif() + + ExternalProject_Add(pyarrow_ext + PREFIX external/pyarrow + DEPENDS arrow_ep + DOWNLOAD_COMMAND "" + BUILD_IN_SOURCE 1 + CONFIGURE_COMMAND cd ${ARROW_SOURCE_DIR}/python && ${CMAKE_COMMAND} -E env ${pyarrow_ENV} ${PYTHON_EXECUTABLE} setup.py build + BUILD_COMMAND cd ${ARROW_SOURCE_DIR}/python && ${CMAKE_COMMAND} -E env ${pyarrow_ENV} ${PYTHON_EXECUTABLE} setup.py build_ext + INSTALL_COMMAND bash -c "cp -rf \$(find ${ARROW_SOURCE_DIR}/python/build/ -maxdepth 1 -type d -print | grep -m1 'lib')/pyarrow ${CMAKE_SOURCE_DIR}/python/ray/pyarrow_files/") + + endif() endif () diff --git a/doc/requirements-doc.txt b/doc/requirements-doc.txt index 5d953d3463400..f598baa081679 100644 --- a/doc/requirements-doc.txt +++ b/doc/requirements-doc.txt @@ -9,6 +9,7 @@ pyarrow pyyaml recommonmark redis +setproctitle sphinx sphinx-click sphinx_rtd_theme diff --git a/doc/source/actors.rst b/doc/source/actors.rst index c7594592f5124..0d8b3c94285b5 100644 --- a/doc/source/actors.rst +++ b/doc/source/actors.rst @@ -65,8 +65,7 @@ When ``a1.increment.remote()`` is called, the following events happens. 1. A task is created. 2. The task is assigned directly to the local scheduler responsible for the - actor by the driver's local scheduler. Thus, this scheduling procedure - bypasses the global scheduler. + actor by the driver's local scheduler. 3. An object ID is returned. We can then call ``ray.get`` on the object ID to retrieve the actual value. diff --git a/doc/source/async_api.rst b/doc/source/async_api.rst new file mode 100644 index 0000000000000..95867745f8ee6 --- /dev/null +++ b/doc/source/async_api.rst @@ -0,0 +1,87 @@ +Async API (Experimental) +======================== + +Since Python 3.5, it is possible to write concurrent code using the ``async/await`` `syntax `__. + +This document describes Ray's support for asyncio, which enables integration with popular async frameworks (e.g., aiohttp, aioredis, etc.) for high performance web and prediction serving. + +Starting Ray +------------ + +You must initialize Ray first. + +Please refer to `Starting Ray`_ for instructions. + +.. _`Starting Ray`: http://ray.readthedocs.io/en/latest/tutorial.html#starting-ray + + +Converting Ray objects into asyncio futures +------------------------------------------- + +Ray object IDs can be converted into asyncio futures with ``ray.experimental.async_api``. + +.. code-block:: python + + import asyncio + import time + import ray + from ray.experimental import async_api + + @ray.remote + def f(): + time.sleep(1) + return {'key1': ['value']} + + ray.init() + future = async_api.as_future(f.remote()) + asyncio.get_event_loop().run_until_complete(future) # {'key1': ['value']} + + +.. 
autofunction:: ray.experimental.async_api.as_future + + +Example Usage +------------- + ++----------------------------------------+-----------------------------------------------------+ +| **Basic Python** | **Distributed with Ray** | ++----------------------------------------+-----------------------------------------------------+ +| .. code-block:: python | .. code-block:: python | +| | | +| # Execute f serially. | # Execute f in parallel. | +| | | +| | | +| def f(): | @ray.remote | +| time.sleep(1) | def f(): | +| return 1 | time.sleep(1) | +| | return 1 | +| | | +| | ray.init() | +| results = [f() for i in range(4)] | results = ray.get([f.remote() for i in range(4)]) | ++----------------------------------------+-----------------------------------------------------+ +| **Async Python** | **Async Ray** | ++----------------------------------------+-----------------------------------------------------+ +| .. code-block:: python | .. code-block:: python | +| | | +| # Execute f asynchronously. | # Execute f asynchronously with Ray/asyncio. | +| | | +| | from ray.experimental import async_api | +| | | +| | @ray.remote | +| async def f(): | def f(): | +| await asyncio.sleep(1) | time.sleep(1) | +| return 1 | return 1 | +| | | +| | ray.init() | +| loop = asyncio.get_event_loop() | loop = asyncio.get_event_loop() | +| tasks = [f() for i in range(4)] | tasks = [async_api.as_future(f.remote()) | +| | for i in range(4)] | +| results = loop.run_until_complete( | results = loop.run_until_complete( | +| asyncio.gather(tasks)) | asyncio.gather(tasks)) | ++----------------------------------------+-----------------------------------------------------+ + + +Known Issues +------------ + +Async API support is experimental, and we are working to improve its performance. Please `let us know `__ any issues you encounter. diff --git a/doc/source/autoscaling.rst b/doc/source/autoscaling.rst index 54ebcc350e5e0..90c8e92f3d278 100644 --- a/doc/source/autoscaling.rst +++ b/doc/source/autoscaling.rst @@ -76,6 +76,14 @@ You can use ``ray exec`` to conveniently run commands on clusters. Note that scr # Run a command in a screen (experimental) $ ray exec cluster.yaml 'echo "hello world"' --screen +You can also use ``ray submit`` to execute Python scripts on clusters. This will ``rsync`` the designated file onto the cluster and execute it with the given arguments. + +.. code-block:: bash + + # Run a Python script in a detached tmux session + $ ray submit cluster.yaml --tmux --start --stop tune_experiment.py + + Attaching to the cluster ------------------------ @@ -136,7 +144,8 @@ The default idle timeout is 5 minutes. This is to prevent excessive node churn w Monitoring cluster status ------------------------- -You can monitor cluster usage and auto-scaling status by tailing the autoscaling logs in ``/tmp/raylogs/monitor-*``. +You can monitor cluster usage and auto-scaling status by tailing the autoscaling +logs in ``/tmp/ray/session_*/logs/monitor*``. The Ray autoscaler also reports per-node status in the form of instance tags. In your cloud provider console, you can click on a Node, go the the "Tags" pane, and add the ``ray-node-status`` tag as a column. This lets you see per-node statuses at a glance: diff --git a/doc/source/conf.py b/doc/source/conf.py index 27d0c1200d9c9..2a2b1a37c207e 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -18,44 +18,41 @@ # These lines added to enable Sphinx to work without installing Ray. 
import mock -MOCK_MODULES = ["gym", - "gym.spaces", - "scipy", - "scipy.signal", - "tensorflow", - "tensorflow.contrib", - "tensorflow.contrib.layers", - "tensorflow.contrib.slim", - "tensorflow.contrib.rnn", - "tensorflow.core", - "tensorflow.core.util", - "tensorflow.python", - "tensorflow.python.client", - "tensorflow.python.util", - "ray.local_scheduler", - "ray.plasma", - "ray.core", - "ray.core.generated", - "ray.core.generated.DriverTableMessage", - "ray.core.generated.LocalSchedulerInfoMessage", - "ray.core.generated.ResultTableReply", - "ray.core.generated.SubscribeToDBClientTableReply", - "ray.core.generated.SubscribeToNotificationsReply", - "ray.core.generated.TaskInfo", - "ray.core.generated.TaskReply", - "ray.core.generated.TaskExecutionDependencies", - "ray.core.generated.ClientTableData", - "ray.core.generated.GcsTableEntry", - "ray.core.generated.HeartbeatTableData", - "ray.core.generated.DriverTableData", - "ray.core.generated.ErrorTableData", - "ray.core.generated.ProfileTableData", - "ray.core.generated.ObjectTableData", - "ray.core.generated.ray.protocol.Task", - "ray.core.generated.TablePrefix", - "ray.core.generated.TablePubsub",] +MOCK_MODULES = [ + "gym", + "gym.spaces", + "scipy", + "scipy.signal", + "tensorflow", + "tensorflow.contrib", + "tensorflow.contrib.all_reduce", + "tensorflow.contrib.all_reduce.python", + "tensorflow.contrib.layers", + "tensorflow.contrib.slim", + "tensorflow.contrib.rnn", + "tensorflow.core", + "tensorflow.core.util", + "tensorflow.python", + "tensorflow.python.client", + "tensorflow.python.util", + "ray.raylet", + "ray.plasma", + "ray.core", + "ray.core.generated", + "ray.core.generated.ClientTableData", + "ray.core.generated.GcsTableEntry", + "ray.core.generated.HeartbeatTableData", + "ray.core.generated.HeartbeatBatchTableData", + "ray.core.generated.DriverTableData", + "ray.core.generated.ErrorTableData", + "ray.core.generated.ProfileTableData", + "ray.core.generated.ObjectTableData", + "ray.core.generated.ray.protocol.Task", + "ray.core.generated.TablePrefix", + "ray.core.generated.TablePubsub", +] for mod_name in MOCK_MODULES: - sys.modules[mod_name] = mock.Mock() + sys.modules[mod_name] = mock.Mock() # ray.rllib.models.action_dist.py and # ray.rllib.models.lstm.py will use tf.VERSION sys.modules["tensorflow"].VERSION = "9.9.9" @@ -89,7 +86,7 @@ source_suffix = ['.rst', '.md'] source_parsers = { - '.md': CommonMarkParser, + '.md': CommonMarkParser, } # The encoding of source files. @@ -259,25 +256,24 @@ # -- Options for LaTeX output --------------------------------------------- latex_elements = { -# The paper size ('letterpaper' or 'a4paper'). -#'papersize': 'letterpaper', + # The paper size ('letterpaper' or 'a4paper'). + #'papersize': 'letterpaper', -# The font size ('10pt', '11pt' or '12pt'). -#'pointsize': '10pt', + # The font size ('10pt', '11pt' or '12pt'). + #'pointsize': '10pt', -# Additional stuff for the LaTeX preamble. -#'preamble': '', + # Additional stuff for the LaTeX preamble. + #'preamble': '', -# Latex figure (float) alignment -#'figure_align': 'htbp', + # Latex figure (float) alignment + #'figure_align': 'htbp', } # Grouping the document tree into LaTeX files. List of tuples # (source start file, target name, title, # author, documentclass [howto, manual, or own class]). 
latex_documents = [ - (master_doc, 'Ray.tex', u'Ray Documentation', - u'The Ray Team', 'manual'), + (master_doc, 'Ray.tex', u'Ray Documentation', u'The Ray Team', 'manual'), ] # The name of an image file (relative to this directory) to place at the top of @@ -300,29 +296,23 @@ # If false, no module index is generated. #latex_domain_indices = True - # -- Options for manual page output --------------------------------------- # One entry per manual page. List of tuples # (source start file, name, description, authors, manual section). -man_pages = [ - (master_doc, 'ray', u'Ray Documentation', - [author], 1) -] +man_pages = [(master_doc, 'ray', u'Ray Documentation', [author], 1)] # If true, show URL addresses after external links. #man_show_urls = False - # -- Options for Texinfo output ------------------------------------------- # Grouping the document tree into Texinfo files. List of tuples # (source start file, target name, title, author, # dir menu entry, description, category) texinfo_documents = [ - (master_doc, 'Ray', u'Ray Documentation', - author, 'Ray', 'One line description of project.', - 'Miscellaneous'), + (master_doc, 'Ray', u'Ray Documentation', author, 'Ray', + 'One line description of project.', 'Miscellaneous'), ] # Documents to append as an appendix to all manuals. diff --git a/doc/source/custom_metric.png b/doc/source/custom_metric.png new file mode 100644 index 0000000000000..3f448613711a3 Binary files /dev/null and b/doc/source/custom_metric.png differ diff --git a/doc/source/distributed_sgd.rst b/doc/source/distributed_sgd.rst new file mode 100644 index 0000000000000..5d1e480766258 --- /dev/null +++ b/doc/source/distributed_sgd.rst @@ -0,0 +1,56 @@ +Distributed SGD (Experimental) +============================== + +Ray includes an implementation of synchronous distributed stochastic gradient descent (SGD), which is competitive in performance with implementations in Horovod and Distributed TensorFlow. + +Ray SGD is built on top of the Ray task and actor abstractions to provide seamless integration into existing Ray applications. + +Interface +--------- + +To use Ray SGD, define a `model class `__ with ``loss`` and ``optimizer`` attributes: + +.. autoclass:: ray.experimental.sgd.Model + +Then, pass a model creator function to the ``ray.experimental.sgd.DistributedSGD`` class. To drive the distributed training, ``sgd.step()`` can be called repeatedly: + +.. code-block:: python + + model_creator = lambda worker_idx, device_idx: YourModelClass() + + sgd = DistributedSGD( + model_creator, + num_workers=2, + devices_per_worker=4, + gpu=True, + strategy="ps") + + for i in range(NUM_ITERS): + sgd.step() + +Under the hood, Ray SGD will create *replicas* of your model onto each hardware device (GPU) allocated to workers (controlled by ``num_workers``). Multiple devices can be managed by each worker process (controlled by ``devices_per_worker``). Each model instance will be in a separate TF variable scope. The ``DistributedSGD`` class coordinates the distributed computation and application of gradients to improve the model. + +There are two distributed SGD strategies available for use: + - ``strategy="simple"``: Gradients are averaged centrally on the driver before being applied to each model replica. This is a reference implementation for debugging purposes. + - ``strategy="ps"``: Gradients are computed and averaged within each node. Gradients are then averaged across nodes through a number of parameter server actors. 
To pipeline the computation of gradients and transmission across the network, we use a custom TensorFlow op that can read and write to the Ray object store directly. + +Note that when ``num_workers=1``, only local allreduce will be used and the choice of distributed strategy is irrelevant. + +The full documentation for ``DistributedSGD`` is as follows: + +.. autoclass:: ray.experimental.sgd.DistributedSGD + +Examples +-------- + +For examples of end-to-end usage, check out the `ImageNet synthetic data test `__ and also the simple `MNIST training example `__, which includes examples of how access the model weights and monitor accuracy as training progresses. + +Performance +----------- + +When using the new Ray backend (which will be enabled by default in Ray 0.6+), we `expect `__ performance competitive with other synchronous SGD implementations on 25Gbps Ethernet. + +.. figure:: sgd.png + :width: 756px + + Images per second reached when distributing the training of a ResNet-101 TensorFlow model (from the official TF benchmark). All experiments were run on p3.16xl instances connected by 25Gbps Ethernet, and workers allocated 4 GPUs per node as done in the Horovod benchmark. diff --git a/doc/source/example-a3c.rst b/doc/source/example-a3c.rst index 665d49a365512..47378fce9f915 100644 --- a/doc/source/example-a3c.rst +++ b/doc/source/example-a3c.rst @@ -9,11 +9,11 @@ View the `code for this example`_. .. _`A3C`: https://arxiv.org/abs/1602.01783 .. _`Universe Starter Agent`: https://github.com/openai/universe-starter-agent -.. _`code for this example`: https://github.com/ray-project/ray/tree/master/python/ray/rllib/a3c +.. _`code for this example`: https://github.com/ray-project/ray/tree/master/python/ray/rllib/agents/a3c .. note:: - For an overview of Ray's reinforcement learning library, see `Ray RLlib `__. + For an overview of Ray's reinforcement learning library, see `RLlib `__. To run the application, first install **ray** and then some dependencies: @@ -29,7 +29,7 @@ You can run the code with .. code-block:: bash - python/ray/rllib/train.py --env=Pong-ram-v4 --run=A3C --config='{"num_workers": N}' + rllib train --env=Pong-ram-v4 --run=A3C --config='{"num_workers": N}' Reinforcement Learning ---------------------- diff --git a/doc/source/example-evolution-strategies.rst b/doc/source/example-evolution-strategies.rst index 16cdc3126d8f5..d048d261fff95 100644 --- a/doc/source/example-evolution-strategies.rst +++ b/doc/source/example-evolution-strategies.rst @@ -11,20 +11,20 @@ To run the application, first install some dependencies. You can view the `code for this example`_. -.. _`code for this example`: https://github.com/ray-project/ray/tree/master/python/ray/rllib/es +.. _`code for this example`: https://github.com/ray-project/ray/tree/master/python/ray/rllib/agents/es The script can be run as follows. Note that the configuration is tuned to work on the ``Humanoid-v1`` gym environment. .. code-block:: bash - python/ray/rllib/train.py --env=Humanoid-v1 --run=ES + rllib train --env=Humanoid-v1 --run=ES To train a policy on a cluster (e.g., using 900 workers), run the following. .. code-block:: bash - python ray/python/ray/rllib/train.py \ + rllib train \ --env=Humanoid-v1 \ --run=ES \ --redis-address= \ diff --git a/doc/source/example-policy-gradient.rst b/doc/source/example-policy-gradient.rst index 806764560ba95..9b58575044c3b 100644 --- a/doc/source/example-policy-gradient.rst +++ b/doc/source/example-policy-gradient.rst @@ -6,7 +6,7 @@ View the `code for this example`_. .. 
note:: - For an overview of Ray's reinforcement learning library, see `Ray RLlib `__. + For an overview of Ray's reinforcement learning library, see `RLlib `__. To run this example, you will need to install `TensorFlow with GPU support`_ (at @@ -21,7 +21,7 @@ Then you can run the example as follows. .. code-block:: bash - python/ray/rllib/train.py --env=Pong-ram-v4 --run=PPO + rllib train --env=Pong-ram-v4 --run=PPO This will train an agent on the ``Pong-ram-v4`` Atari environment. You can also try passing in the ``Pong-v0`` environment or the ``CartPole-v0`` environment. @@ -39,4 +39,4 @@ Many of the TensorBoard metrics are also printed to the console, but you might find it easier to visualize and compare between runs using the TensorBoard UI. .. _`TensorFlow with GPU support`: https://www.tensorflow.org/install/ -.. _`code for this example`: https://github.com/ray-project/ray/tree/master/python/ray/rllib/ppo +.. _`code for this example`: https://github.com/ray-project/ray/tree/master/python/ray/rllib/agents/ppo diff --git a/doc/source/fault-tolerance.rst b/doc/source/fault-tolerance.rst index a4692f904feea..6c388c9f8883e 100644 --- a/doc/source/fault-tolerance.rst +++ b/doc/source/fault-tolerance.rst @@ -6,16 +6,9 @@ This document describes the handling of failures in Ray. Machine and Process Failures ---------------------------- -Currently, each **local scheduler** and each **plasma manager** send heartbeats -to a **monitor** process. If the monitor does not receive any heartbeats from a -given process for some duration of time (about ten seconds), then it will mark -that process as dead. The monitor process will then clean up the associated -state in the Redis servers. If a manager is marked as dead, the object table -will be updated to remove all occurrences of that manager so that other managers -don't try to fetch objects from the dead manager. If a local scheduler is marked -as dead, all of the tasks that are marked as executing on that local scheduler -in the task table will be marked as lost and all actors associated with that -local scheduler will be recreated by other local schedulers. +Each **raylet** (the scheduler process) sends heartbeats to a **monitor** +process. If the monitor does not receive any heartbeats from a given raylet for +some period of time (about ten seconds), then it will mark that process as dead. Lost Objects ------------ @@ -23,19 +16,16 @@ Lost Objects If an object is needed but is lost or was never created, then the task that created the object will be re-executed to create the object. If necessary, tasks needed to create the input arguments to the task being re-executed will also be -re-executed. +re-executed. This is the standard *lineage-based fault tolerance* strategy used +by other systems like Spark. Actors ------ -When a local scheduler is marked as dead, all actors associated with that local -scheduler that were still alive will be recreated by other local schedulers. By -default, all of the actor methods will be re-executed in the same order that -they were initially executed. If actor checkpointing is enabled, then the actor -state will be loaded from the most recent checkpoint and the actor methods that -occurred after the checkpoint will be re-executed. Note that actor checkpointing -is currently an experimental feature. - +When an actor dies (either because the actor process crashed or because the node +that the actor was on died), by default any attempt to get an object from that +actor that cannot be created will raise an exception. 
Subsequent releases will +include an option for automatically restarting actors. Current Limitations ------------------- @@ -47,7 +37,7 @@ Process Failures ~~~~~~~~~~~~~~~~ 1. Ray does not recover from the failure of any of the following processes: - a Redis server, the global scheduler, the monitor process. + a Redis server and the monitor process. 2. If a driver fails, that driver will not be restarted and the job will not complete. @@ -58,9 +48,3 @@ Lost Objects evicted, and is later needed, Ray will not reconstruct this object. 2. If an object is constructed by an actor method, is then evicted, and is later needed, Ray will not reconstruct this object. - -Actor Reconstruction -~~~~~~~~~~~~~~~~~~~~ - -1. Actor reconstruction follows the order of initial execution, but new tasks - may get interleaved with the re-executed tasks. diff --git a/doc/source/images/ray_logo.png b/doc/source/images/ray_logo.png new file mode 100644 index 0000000000000..05840a7ff453e Binary files /dev/null and b/doc/source/images/ray_logo.png differ diff --git a/doc/source/impala.png b/doc/source/impala.png index a7d12e4b5a0f9..0d42fe6e07dc9 100644 Binary files a/doc/source/impala.png and b/doc/source/impala.png differ diff --git a/doc/source/index.rst b/doc/source/index.rst index b71987108be05..68a33676c80d8 100644 --- a/doc/source/index.rst +++ b/doc/source/index.rst @@ -42,6 +42,7 @@ Ray comes with libraries that accelerate deep learning and reinforcement learnin - `Tune`_: Scalable Hyperparameter Search - `RLlib`_: Scalable Reinforcement Learning +- `Distributed Training `__ .. _`Tune`: tune.html .. _`RLlib`: rllib.html @@ -64,6 +65,7 @@ Ray comes with libraries that accelerate deep learning and reinforcement learnin actors.rst using-ray-with-gpus.rst webui.rst + async_api.rst .. toctree:: :maxdepth: 1 @@ -74,10 +76,11 @@ Ray comes with libraries that accelerate deep learning and reinforcement learnin tune-schedulers.rst tune-searchalg.rst tune-package-ref.rst + tune-examples.rst .. toctree:: :maxdepth: 1 - :caption: Ray RLlib + :caption: RLlib rllib.rst rllib-training.rst @@ -89,8 +92,9 @@ Ray comes with libraries that accelerate deep learning and reinforcement learnin .. toctree:: :maxdepth: 1 - :caption: Pandas on Ray + :caption: Other Libraries + distributed_sgd.rst pandas_on_ray.rst .. toctree:: @@ -118,6 +122,7 @@ Ray comes with libraries that accelerate deep learning and reinforcement learnin plasma-object-store.rst resources.rst redis-memory-management.rst + tempfile.rst .. toctree:: :maxdepth: 1 @@ -134,6 +139,7 @@ Ray comes with libraries that accelerate deep learning and reinforcement learnin troubleshooting.rst user-profiling.rst + security.rst development.rst profiling.rst contact.rst diff --git a/doc/source/installation.rst b/doc/source/installation.rst index 4c4bc3f165ef7..68bd37ae96f5d 100644 --- a/doc/source/installation.rst +++ b/doc/source/installation.rst @@ -3,17 +3,23 @@ Installing Ray Ray should work with Python 2 and Python 3. We have tested Ray on Ubuntu 14.04, Ubuntu 16.04, OS X 10.11 and 10.12. -You can install Ray as follows. +Latest stable version +--------------------- + +You can install the latest stable version of Ray as follows. .. code-block:: bash - pip install ray + pip install -U ray # also recommended: ray[debug] + +Trying snapshots from master +---------------------------- + +Here are links to the latest wheels (which are built off of master). To install these wheels, run the following command: -Trying the latest version of Ray --------------------------------- +.. 
danger:: -Here are links to the latest wheels (which are built off of master). These versions will have newer -features but may be subject to more bugs. To install these wheels, run the following command: + These versions will have newer features but are subject to more bugs. If you encounter crashes or other instabilities, please revert to the latest stable version. .. code-block:: bash @@ -23,6 +29,7 @@ features but may be subject to more bugs. To install these wheels, run the follo =================== =================== Linux MacOS =================== =================== +`Linux Python 3.7`_ `MacOS Python 3.7`_ `Linux Python 3.6`_ `MacOS Python 3.6`_ `Linux Python 3.5`_ `MacOS Python 3.5`_ `Linux Python 3.4`_ `MacOS Python 3.4`_ @@ -30,14 +37,16 @@ features but may be subject to more bugs. To install these wheels, run the follo =================== =================== -.. _`Linux Python 3.6`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp36-cp36m-manylinux1_x86_64.whl -.. _`Linux Python 3.5`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp35-cp35m-manylinux1_x86_64.whl -.. _`Linux Python 3.4`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp34-cp34m-manylinux1_x86_64.whl -.. _`Linux Python 2.7`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp27-cp27mu-manylinux1_x86_64.whl -.. _`MacOS Python 3.6`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp36-cp36m-macosx_10_6_intel.whl -.. _`MacOS Python 3.5`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp35-cp35m-macosx_10_6_intel.whl -.. _`MacOS Python 3.4`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp34-cp34m-macosx_10_6_intel.whl -.. _`MacOS Python 2.7`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp27-cp27m-macosx_10_6_intel.whl +.. _`Linux Python 3.7`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp37-cp37m-manylinux1_x86_64.whl +.. _`Linux Python 3.6`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp36-cp36m-manylinux1_x86_64.whl +.. _`Linux Python 3.5`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp35-cp35m-manylinux1_x86_64.whl +.. _`Linux Python 3.4`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp34-cp34m-manylinux1_x86_64.whl +.. _`Linux Python 2.7`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp27-cp27mu-manylinux1_x86_64.whl +.. _`MacOS Python 3.7`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp37-cp37m-macosx_10_6_intel.whl +.. _`MacOS Python 3.6`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp36-cp36m-macosx_10_6_intel.whl +.. _`MacOS Python 3.5`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp35-cp35m-macosx_10_6_intel.whl +.. _`MacOS Python 3.4`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp34-cp34m-macosx_10_6_intel.whl +.. _`MacOS Python 2.7`: https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp27-cp27m-macosx_10_6_intel.whl Building Ray from source @@ -67,7 +76,7 @@ For Ubuntu, run the following commands: # If you are on Ubuntu 14.04, you need the following. 
pip install cmake - pip install cython + pip install cython==0.27.3 For MacOS, run the following commands: @@ -76,7 +85,7 @@ For MacOS, run the following commands: brew update brew install cmake pkg-config automake autoconf libtool openssl bison wget - pip install cython + pip install cython==0.27.3 If you are using Anaconda, you may also need to run the following. diff --git a/doc/source/internals-overview.rst b/doc/source/internals-overview.rst index 69ac1895a55c7..a2516de1d10ce 100644 --- a/doc/source/internals-overview.rst +++ b/doc/source/internals-overview.rst @@ -15,8 +15,8 @@ Running Ray standalone Ray can be used standalone by calling ``ray.init()`` within a script. When the call to ``ray.init()`` happens, all of the relevant processes are started. -These include a local scheduler, a global scheduler, an object store and -manager, a Redis server, and a number of worker processes. +These include a local scheduler, an object store and manager, a Redis server, +and a number of worker processes. When the script exits, these processes will be killed. @@ -112,7 +112,7 @@ When a driver or worker invokes a remote function, a number of things happen. - The task object is then sent to the local scheduler on the same node as the driver or worker. - The local scheduler makes a decision to either schedule the task locally or to - pass the task on to a global scheduler. + pass the task on to another local scheduler. - If all of the task's object dependencies are present in the local object store and there are enough CPU and GPU resources available to execute the diff --git a/doc/source/profiling.rst b/doc/source/profiling.rst index 59d12d635cdeb..55ed8de6fae2b 100644 --- a/doc/source/profiling.rst +++ b/doc/source/profiling.rst @@ -14,54 +14,20 @@ symbolize on Mac OS have failed. sudo apt-get install google-perftools libgoogle-perftools-dev -Changes to compilation and linking ----------------------------------- - -Let's say we want to profile the ``plasma_manager``. Change the link -instruction in ``src/plasma/CMakeLists.txt`` from - -.. code-block:: cmake - - target_link_libraries(plasma_manager common ${PLASMA_STATIC_LIB} ray_static ${ARROW_STATIC_LIB} -lpthread) - -to additionally include ``-lprofiler``: - -.. code-block:: cmake - - target_link_libraries(plasma_manager common ${PLASMA_STATIC_LIB} ray_static ${ARROW_STATIC_LIB} -lpthread -lprofiler) - -Additionally, add ``-g -ggdb`` to ``CMAKE_C_FLAGS`` and ``CMAKE_CXX_FLAGS`` to -enable the debug symbols. (Keeping ``-O3`` seems okay.) - -Recompile. - Launching the to-profile binary ------------------------------- -In various places, instead of launching the target binary via -``plasma_manager ``, it must be launched with +If you want to launch Ray in profiling mode, define the following variables: .. code-block:: bash - LD_PRELOAD=/usr/lib/libprofiler.so CPUPROFILE=/tmp/pprof.out plasma_manager - -In practice, this means modifying ``python/ray/plasma/plasma.py`` so that the -manager is launched with a command that passes a ``modified_env`` into -``Popen``. - -.. 
code-block:: python - - modified_env = os.environ.copy() - modified_env["LD_PRELOAD"] = "/usr/lib/libprofiler.so" - modified_env["CPUPROFILE"] = "/tmp/pprof.out" + export RAYLET_PERFTOOLS_PATH=/usr/lib/x86_64-linux-gnu/libprofiler.so + export RAYLET_PERFTOOLS_LOGFILE=/tmp/pprof.out - process = subprocess.Popen(command, - stdout=stdout_file, - stderr=stderr_file, - env=modified_env) The file ``/tmp/pprof.out`` will be empty until you let the binary run the -target workload for a while and then ``kill`` it. +target workload for a while and then ``kill`` it via ``ray stop`` or by +letting the driver exit. Visualizing the CPU profile --------------------------- @@ -72,14 +38,14 @@ zoomable ``.svg`` image displaying the call graph annotated with hot paths. .. code-block:: bash # Use the appropriate path. - PLASMA_MANAGER=ray/python/ray/core/src/plasma/plasma_manager + RAYLET=ray/python/ray/core/src/ray/raylet/raylet - google-pprof -svg $PLASMA_MANAGER /tmp/pprof.out > /tmp/pprof.svg + google-pprof -svg $RAYLET /tmp/pprof.out > /tmp/pprof.svg # Then open the .svg file with Chrome. # If you realize the call graph is too large, use -focus= to zoom # into subtrees. - google-pprof -focus=epoll_wait -svg $PLASMA_MANAGER /tmp/pprof.out > /tmp/pprof.svg + google-pprof -focus=epoll_wait -svg $RAYLET /tmp/pprof.out > /tmp/pprof.svg Here's a snapshot of an example svg output, taken from the official documentation: diff --git a/doc/source/redis-memory-management.rst b/doc/source/redis-memory-management.rst index 64d2035ed0f31..5e6edcc02f6c4 100644 --- a/doc/source/redis-memory-management.rst +++ b/doc/source/redis-memory-management.rst @@ -1,4 +1,4 @@ -Redis Memory Management (EXPERIMENTAL) +Redis Memory Management (Experimental) ====================================== Ray stores metadata associated with tasks and objects in one or more Redis @@ -7,92 +7,9 @@ servers, as described in `An Overview of the Internals task/object generation rate could risk high memory pressure, potentially leading to out-of-memory (OOM) errors. -Here, we describe an experimental feature that transparently flushes metadata -entries out of Redis memory. +In Ray `0.6.1+` Redis shards can be configured to LRU evict task and object +metadata by setting ``redis_max_memory`` when starting Ray. This supercedes the +previously documented flushing functionality. -Requirements ------------- - -As of early July 2018, the automatic memory management feature requires building -Ray from source. We are planning on eliminating this step in the near future by -releasing official wheels. - -Building Ray -~~~~~~~~~~~~ - -First, follow `instructions to build Ray from source -`__ to install prerequisites. After -the prerequisites are installed, instead of doing the regular ``pip install`` as -referenced in that document, pass an additional special flag, -``RAY_USE_NEW_GCS=on``: - -.. code-block:: bash - - git clone https://github.com/ray-project/ray.git - cd ray/python - RAY_USE_NEW_GCS=on pip install -e . --verbose # Add --user if you see a permission denied error. - -Running Ray applications -~~~~~~~~~~~~~~~~~~~~~~~~ - -At run time the environment variables ``RAY_USE_NEW_GCS=on`` and -``RAY_USE_XRAY=1`` are required. - -.. code-block:: bash - - export RAY_USE_NEW_GCS=on - export RAY_USE_XRAY=1 - python my_ray_script.py # Or launch python/ipython. - -Activate memory flushing ------------------------- - -After building Ray using the method above, simply add these two lines after -``ray.init()`` to activate automatic memory flushing: - -.. 
code-block:: python - - ray.init(...) - - policy = ray.experimental.SimpleGcsFlushPolicy() - ray.experimental.set_flushing_policy(policy) - - # My awesome Ray application logic follows. - -Paramaters of the flushing policy ---------------------------------- - -There are three `user-configurable parameters -`_ -of the ``SimpleGcsFlushPolicy``: - -* ``flush_when_at_least_bytes``: Wait until this many bytes of memory usage - accumulated in the redis server before flushing kicks in. -* ``flush_period_secs``: Issue a flush to the Redis server every this many - seconds. -* ``flush_num_entries_each_time``: A hint to the system on the number of entries - to flush on each request. - -The default values should serve to be non-invasive for lightweight Ray -applications. ``flush_when_at_least_bytes`` is set to ``(1<<31)`` or 2GB, -``flush_period_secs`` to 10, and ``flush_num_entries_each_time`` to 10000: - -.. code-block:: python - - # Default parameters. - ray.experimental.SimpleGcsFlushPolicy( - flush_when_at_least_bytes=(1 << 31), - flush_period_secs=10, - flush_num_entries_each_time=10000) - -In particular, these default values imply that - -1. the Redis server would accumulate memory usage up to 2GB without any entries -being flushed, then the flushing would kick in; and - -2. generally, "older" metadata entries would be flushed first, and the Redis -server would always keep the most recent window of metadata of 2GB in size. - -**For advanced users.** Advanced users can tune the above parameters to their -applications' needs; note that the desired flush rate is equal to (flush -period) * (num entries each flush). +Note that profiling is disabled when ``redis_max_memory`` is set. This is because +profiling data cannot be LRU evicted. diff --git a/doc/source/resources.rst b/doc/source/resources.rst index e0dc9d742ec28..4be2f61afbe4b 100644 --- a/doc/source/resources.rst +++ b/doc/source/resources.rst @@ -1,5 +1,5 @@ -Resource (CPUs, GPUs) -===================== +Resources (CPUs, GPUs) +====================== This document describes how resources are managed in Ray. Each node in a Ray cluster knows its own resource capacities, and each task specifies its resource @@ -39,7 +39,8 @@ Specifying a task's CPU and GPU requirements ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ To specify a task's CPU and GPU requirements, pass the ``num_cpus`` and -``num_gpus`` arguments into the remote decorator. +``num_gpus`` arguments into the remote decorator. Note that Ray supports +**fractional** resource requirements. .. code-block:: python @@ -47,7 +48,11 @@ To specify a task's CPU and GPU requirements, pass the ``num_cpus`` and def f(): return 1 -When ``f`` tasks will be scheduled on machines that have at least 4 CPUs and 2 + @ray.remote(num_gpus=0.5) + def h(): + return 1 + +The ``f`` tasks will be scheduled on machines that have at least 4 CPUs and 2 GPUs, and when one of the ``f`` tasks executes, 4 CPUs and 2 GPUs will be reserved for that task. The IDs of the GPUs that are reserved for the task can be accessed with ``ray.get_gpu_ids()``. Ray will automatically set the @@ -108,3 +113,9 @@ decorator. @ray.remote(resources={'Resource2': 1}) def f(): return 1 + +Fractional Resources +-------------------- + +Task and actor resource requirements can be fractional. This is particularly +useful if you want multiple tasks or actors to share a single GPU. 
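To make the fractional-resource behavior concrete, here is a minimal sketch (not part of the original docs; the ``0.25`` value and the names are illustrative) of several tasks and an actor sharing one GPU:

.. code-block:: python

    import ray

    ray.init(num_gpus=1)

    # Four of these tasks can run concurrently, since each one reserves
    # only a quarter of the single GPU.
    @ray.remote(num_gpus=0.25)
    def gpu_task():
        return ray.get_gpu_ids()

    # Actors can reserve fractional GPUs in the same way.
    @ray.remote(num_gpus=0.25)
    class GPUActor(object):
        def gpu_ids(self):
            return ray.get_gpu_ids()

    print(ray.get([gpu_task.remote() for _ in range(4)]))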
diff --git a/doc/source/rllib-algorithms.rst b/doc/source/rllib-algorithms.rst index d764fc7ad8ea3..1d0501215745c 100644 --- a/doc/source/rllib-algorithms.rst +++ b/doc/source/rllib-algorithms.rst @@ -38,14 +38,21 @@ SpaceInvaders 646 ~300 Ape-X using 32 workers in RLlib vs vanilla DQN (orange) and A3C (blue) on PongNoFrameskip-v4. +**Ape-X specific configs** (see also `common configs `__): + +.. literalinclude:: ../../python/ray/rllib/agents/dqn/apex.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ + Importance Weighted Actor-Learner Architecture (IMPALA) ------------------------------------------------------- `[paper] `__ `[implementation] `__ -In IMPALA, a central learner runs SGD in a tight loop while asynchronously pulling sample batches from many actor processes. RLlib's IMPALA implementation uses DeepMind's reference `V-trace code `__. Note that we do not provide a deep residual network out of the box, but one can be plugged in as a `custom model `__. +In IMPALA, a central learner runs SGD in a tight loop while asynchronously pulling sample batches from many actor processes. RLlib's IMPALA implementation uses DeepMind's reference `V-trace code `__. Note that we do not provide a deep residual network out of the box, but one can be plugged in as a `custom model `__. Multiple learner GPUs and experience replay are also supported. -Tuned examples: `PongNoFrameskip-v4 `__, `vectorized configuration `__, `{BeamRider,Breakout,Qbert,SpaceInvaders}NoFrameskip-v4 `__ +Tuned examples: `PongNoFrameskip-v4 `__, `vectorized configuration `__, `multi-gpu configuration `__, `{BeamRider,Breakout,Qbert,SpaceInvaders}NoFrameskip-v4 `__ **Atari results @10M steps**: `more details `__ @@ -71,7 +78,15 @@ SpaceInvaders 843 ~300 .. figure:: impala.png - IMPALA solves Atari several times faster than A2C / A3C, with similar sample efficiency. Here IMPALA scales from 16 to 128 workers to solve PongNoFrameskip-v4 in ~8 minutes. + Multi-GPU IMPALA scales up to solve PongNoFrameskip-v4 in ~3 minutes using a pair of V100 GPUs and 128 CPU workers. + The maximum training throughput reached is ~30k transitions per second (~120k environment frames per second). + +**IMPALA-specific configs** (see also `common configs `__): + +.. literalinclude:: ../../python/ray/rllib/agents/impala/impala.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ Gradient-based ~~~~~~~~~~~~~~ @@ -97,17 +112,31 @@ Qbert 3620 ~1000 SpaceInvaders 692 ~600 ============= ======================== ============================== -Deep Deterministic Policy Gradients (DDPG) ------------------------------------------- +**A3C-specific configs** (see also `common configs `__): + +.. literalinclude:: ../../python/ray/rllib/agents/a3c/a3c.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ + +Deep Deterministic Policy Gradients (DDPG, TD3) +----------------------------------------------- `[paper] `__ `[implementation] `__ -DDPG is implemented similarly to DQN (below). The algorithm can be scaled by increasing the number of workers, switching to AsyncGradientsOptimizer, or using Ape-X. +DDPG is implemented similarly to DQN (below). The algorithm can be scaled by increasing the number of workers, switching to AsyncGradientsOptimizer, or using Ape-X. The improvements from `TD3 `__ are available though not enabled by default. 
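As a quick, illustrative invocation (not from the original docs; the worker count is arbitrary), DDPG can be launched on a continuous-control environment with the ``rllib train`` command described in the training documentation:

.. code-block:: bash

    rllib train --run DDPG --env Pendulum-v0 --config '{"num_workers": 4}'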
+ +Tuned examples: `Pendulum-v0 `__, `TD3 configuration `__, `MountainCarContinuous-v0 `__, `HalfCheetah-v2 `__ -Tuned examples: `Pendulum-v0 `__, `MountainCarContinuous-v0 `__, `HalfCheetah-v2 `__ +**DDPG-specific configs** (see also `common configs `__): -Deep Q Networks (DQN, Rainbow) ------------------------------- +.. literalinclude:: ../../python/ray/rllib/agents/ddpg/ddpg.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ + +Deep Q Networks (DQN, Rainbow, Parametric DQN) +---------------------------------------------- `[paper] `__ `[implementation] `__ -RLlib DQN is implemented using the SyncReplayOptimizer. The algorithm can be scaled by increasing the number of workers, using the AsyncGradientsOptimizer for async DQN, or using Ape-X. Memory usage is reduced by compressing samples in the replay buffer with LZ4. All of the DQN improvements evaluated in `Rainbow `__ are available, though not all are enabled by default. +RLlib DQN is implemented using the SyncReplayOptimizer. The algorithm can be scaled by increasing the number of workers, using the AsyncGradientsOptimizer for async DQN, or using Ape-X. Memory usage is reduced by compressing samples in the replay buffer with LZ4. All of the DQN improvements evaluated in `Rainbow `__ are available, though not all are enabled by default. See also how to use `parametric-actions in DQN `__. Tuned examples: `PongDeterministic-v4 `__, `Rainbow configuration `__, `{BeamRider,Breakout,Qbert,SpaceInvaders}NoFrameskip-v4 `__, `with Dueling and Double-Q `__, `with Distributional DQN `__. @@ -125,12 +154,26 @@ Qbert 3921 7968 15780 SpaceInvaders 650 1001 1025 ~500 ============= ======================== ============================= ============================== =============================== +**DQN-specific configs** (see also `common configs `__): + +.. literalinclude:: ../../python/ray/rllib/agents/dqn/dqn.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ + Policy Gradients ---------------- `[paper] `__ `[implementation] `__ We include a vanilla policy gradients implementation as an example algorithm. This is usually outperformed by PPO. Tuned examples: `CartPole-v0 `__ +**PG-specific configs** (see also `common configs `__): + +.. literalinclude:: ../../python/ray/rllib/agents/pg/pg.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ + Proximal Policy Optimization (PPO) ---------------------------------- `[paper] `__ `[implementation] `__ @@ -158,6 +201,13 @@ SpaceInvaders 671 944 ~800 RLlib's multi-GPU PPO scales to multiple GPUs and hundreds of CPUs on solving the Humanoid-v1 task. Here we compare against a reference MPI-based implementation. +**PPO-specific configs** (see also `common configs `__): + +.. literalinclude:: ../../python/ray/rllib/agents/ppo/ppo.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ + Derivative-free ~~~~~~~~~~~~~~~ @@ -168,6 +218,13 @@ ARS is a random search method for training linear policies for continuous contro Tuned examples: `CartPole-v0 `__, `Swimmer-v2 `__ +**ARS-specific configs** (see also `common configs `__): + +.. literalinclude:: ../../python/ray/rllib/agents/ars/ars.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ + Evolution Strategies -------------------- `[paper] `__ `[implementation] `__ @@ -181,3 +238,10 @@ Tuned examples: `Humanoid-v1 `__): + +.. 
literalinclude:: ../../python/ray/rllib/agents/es/es.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ diff --git a/doc/source/rllib-concepts.rst b/doc/source/rllib-concepts.rst index f752279cb58d3..68c160c912b05 100644 --- a/doc/source/rllib-concepts.rst +++ b/doc/source/rllib-concepts.rst @@ -17,7 +17,7 @@ Policy Evaluation Given an environment and policy graph, policy evaluation produces `batches `__ of experiences. This is your classic "environment interaction loop". Efficient policy evaluation can be burdensome to get right, especially when leveraging vectorization, RNNs, or when operating in a multi-agent environment. RLlib provides a `PolicyEvaluator `__ class that manages all of this, and this class is used in most RLlib algorithms. -You can also use policy evaluation standalone to produce batches of experiences. This can be done by calling ``ev.sample()`` on an evaluator instance, or ``ev.sample.remote()`` in parallel on evaluator instances created as Ray actors (see ``PolicyEvalutor.as_remote()``). +You can also use policy evaluation standalone to produce batches of experiences. This can be done by calling ``ev.sample()`` on an evaluator instance, or ``ev.sample.remote()`` in parallel on evaluator instances created as Ray actors (see ``PolicyEvaluator.as_remote()``). Policy Optimization ------------------- diff --git a/doc/source/rllib-env.rst b/doc/source/rllib-env.rst index 6de076785707f..4f8a4c66ae4c3 100644 --- a/doc/source/rllib-env.rst +++ b/doc/source/rllib-env.rst @@ -5,27 +5,58 @@ RLlib works with several different types of environments, including `OpenAI Gym .. image:: rllib-envs.svg -In the high-level agent APIs, environments are identified with string names. By default, the string will be interpreted as a gym `environment name `__, however you can also register custom environments by name: +**Compatibility matrix**: + +============= ======================= ================== =========== ================== +Algorithm Discrete Actions Continuous Actions Multi-Agent Recurrent Policies +============= ======================= ================== =========== ================== +A2C, A3C **Yes** `+parametric`_ **Yes** **Yes** **Yes** +PPO **Yes** `+parametric`_ **Yes** **Yes** **Yes** +PG **Yes** `+parametric`_ **Yes** **Yes** **Yes** +IMPALA **Yes** `+parametric`_ No **Yes** **Yes** +DQN, Rainbow **Yes** `+parametric`_ No **Yes** No +DDPG, TD3 No **Yes** **Yes** No +APEX-DQN **Yes** `+parametric`_ No **Yes** No +APEX-DDPG No **Yes** **Yes** No +ES **Yes** **Yes** No No +ARS **Yes** **Yes** No No +============= ======================= ================== =========== ================== + +.. _`+parametric`: rllib-models.html#variable-length-parametric-action-spaces + +You can pass either a string name or a Python class to specify an environment. By default, strings will be interpreted as a gym `environment name `__. Custom env classes must take a single ``env_config`` parameter in their constructor: .. code-block:: python import ray - from ray.tune.registry import register_env from ray.rllib.agents import ppo - def env_creator(env_config): - import gym - return gym.make("CartPole-v0") # or return your own custom env + class MyEnv(gym.Env): + def __init__(self, env_config): + self.action_space = ... + self.observation_space = ... + ... 
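        # Editor's sketch (not part of the original patch): a custom env must
        # also implement the usual Gym methods; the shapes and values below
        # are placeholders.
        def reset(self):
            # Return an initial observation.
            return self.observation_space.sample()

        def step(self, action):
            # Return (observation, reward, done, info) per the Gym API.
            return self.observation_space.sample(), 0.0, True, {}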
- register_env("my_env", env_creator) ray.init() - trainer = ppo.PPOAgent(env="my_env", config={ - "env_config": {}, # config to pass to env creator + trainer = ppo.PPOAgent(env=MyEnv, config={ + "env_config": {}, # config to pass to env class }) while True: print(trainer.train()) +You can also register a custom env creator function with a string name. This function must take a single ``env_config`` parameter and return an env instance: + +.. code-block:: python + + from ray.tune.registry import register_env + + def env_creator(env_config): + return MyEnv(...) # return an env instance + + register_env("my_env", env_creator) + trainer = ppo.PPOAgent(env="my_env") + Configuring Environments ------------------------ @@ -50,14 +81,14 @@ In the above example, note that the ``env_creator`` function takes in an ``env_c OpenAI Gym ---------- -RLlib uses Gym as its environment interface for single-agent training. For more information on how to implement a custom Gym environment, see the `gym.Env class definition `__. You may also find the `SimpleCorridor `__ and `Carla simulator `__ example env implementations useful as a reference. +RLlib uses Gym as its environment interface for single-agent training. For more information on how to implement a custom Gym environment, see the `gym.Env class definition `__. You may also find the `SimpleCorridor `__ and `Carla simulator `__ example env implementations useful as a reference. Performance ~~~~~~~~~~~ There are two ways to scale experience collection with Gym environments: - 1. **Vectorization within a single process:** Though many envs can very achieve high frame rates per core, their throughput is limited in practice by policy evaluation between steps. For example, even small TensorFlow models incur a couple milliseconds of latency to evaluate. This can be worked around by creating multiple envs per process and batching policy evaluations across these envs. + 1. **Vectorization within a single process:** Though many envs can achieve high frame rates per core, their throughput is limited in practice by policy evaluation between steps. For example, even small TensorFlow models incur a couple milliseconds of latency to evaluate. This can be worked around by creating multiple envs per process and batching policy evaluations across these envs. You can configure ``{"num_envs_per_worker": M}`` to have RLlib create ``M`` concurrent environments per worker. RLlib auto-vectorizes Gym environments via `VectorEnv.wrap() `__. @@ -76,6 +107,10 @@ RLlib will auto-vectorize Gym envs for batch evaluation if the ``num_envs_per_wo Multi-Agent ----------- +.. note:: + + Learn more about multi-agent reinforcement learning in RLlib by reading the `blog post `__. + A multi-agent environment is one which has multiple acting entities per step, e.g., in a traffic simulation, there may be multiple "car" and "traffic light" agents in the environment. The model for multi-agent in RLlib as follows: (1) as a user you define the number of policies available up front, and (2) a function that maps agent ids to policy ids. This is summarized by the below figure: .. image:: multi-agent.svg @@ -132,25 +167,93 @@ If all the agents will be using the same algorithm class to train, then you can RLlib will create three distinct policies and route agent decisions to its bound policy. When an agent first appears in the env, ``policy_mapping_fn`` will be called to determine which policy it is bound to. 
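As a sketch of what such a mapping could look like (the agent id prefixes and policy names below are hypothetical, following the traffic example above):

.. code-block:: python

    def policy_mapping_fn(agent_id):
        # Route traffic-light agents to one policy and car agents to another.
        if agent_id.startswith("traffic_light"):
            return "traffic_light_policy"
        return "car_policy"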
RLlib reports separate training statistics for each policy in the return from ``train()``, along with the combined reward. -Here is a simple `example training script `__ in which you can vary the number of agents and policies in the environment. For how to use multiple training methods at once (here DQN and PPO), see the `two-trainer example `__. +Here is a simple `example training script `__ in which you can vary the number of agents and policies in the environment. For how to use multiple training methods at once (here DQN and PPO), see the `two-trainer example `__. Metrics are reported for each policy separately, for example: + +.. code-block:: bash + :emphasize-lines: 6,14,22 + + Result for PPO_multi_cartpole_0: + episode_len_mean: 34.025862068965516 + episode_reward_max: 159.0 + episode_reward_mean: 86.06896551724138 + info: + policy_0: + cur_lr: 4.999999873689376e-05 + entropy: 0.6833480000495911 + kl: 0.010264254175126553 + policy_loss: -11.95590591430664 + total_loss: 197.7039794921875 + vf_explained_var: 0.0010995268821716309 + vf_loss: 209.6578826904297 + policy_1: + cur_lr: 4.999999873689376e-05 + entropy: 0.6827034950256348 + kl: 0.01119876280426979 + policy_loss: -8.787769317626953 + total_loss: 88.26161193847656 + vf_explained_var: 0.0005457401275634766 + vf_loss: 97.0471420288086 + policy_reward_mean: + policy_0: 21.194444444444443 + policy_1: 21.798387096774192 To scale to hundreds of agents, MultiAgentEnv batches policy evaluations across multiple agents internally. It can also be auto-vectorized by setting ``num_envs_per_worker > 1``. -Agent-Driven ------------- +Variable-Sharing Between Policies +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -In many situations, it does not make sense for an environment to be "stepped" by RLlib. For example, if a policy is to be used in a web serving system, then it is more natural for an agent to query a service that serves policy decisions, and for that service to learn from experience over time. +RLlib will create each policy's model in a separate ``tf.variable_scope``. However, variables can still be shared between policies by explicitly entering a globally shared variable scope with ``tf.VariableScope(reuse=tf.AUTO_REUSE)``: -RLlib provides the `ServingEnv `__ class for this purpose. Unlike other envs, ServingEnv has its own thread of control. At any point, agents on that thread can query the current policy for decisions via ``self.get_action()`` and reports rewards via ``self.log_returns()``. This can be done for multiple concurrent episodes as well. +.. code-block:: python + + with tf.variable_scope( + tf.VariableScope(tf.AUTO_REUSE, "name_of_global_shared_scope"), + reuse=tf.AUTO_REUSE, + auxiliary_name_scope=False): + + +There is a full example of this in the `example training script `__. + +Implementing a Centralized Critic +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Implementing a centralized critic that takes as input the observations and actions of other concurrent agents requires the definition of custom policy graphs. It can be done as follows: + +1. Querying the critic: this can be done in the ``postprocess_trajectory`` method of a custom policy graph, which has full access to the policies and observations of concurrent agents via the ``other_agent_batches`` and ``episode`` arguments. The batch of critic predictions can then be added to the postprocessed trajectory. Here's an example: + +.. code-block:: python -For example, ServingEnv can be used to implement a simple REST policy `server `__ that learns over time using RLlib. 
In this example RLlib runs with ``num_workers=0`` to avoid port allocation issues, but in principle this could be scaled by increasing ``num_workers``. + def postprocess_trajectory(self, sample_batch, other_agent_batches, episode): + agents = ["agent_1", "agent_2", "agent_3"] # simple example of 3 agents + global_obs_batch = np.stack( + [other_agent_batches[agent_id][1]["obs"] for agent_id in agents], + axis=1) + # add the global obs and global critic value + sample_batch["global_obs"] = global_obs_batch + sample_batch["central_vf"] = self.sess.run( + self.critic_network, feed_dict={"obs": global_obs_batch}) + return sample_batch -Offline Data -~~~~~~~~~~~~ +2. Updating the critic: the centralized critic loss can be added to the loss of the custom policy graph, the same as with any other value function. For an example of defining loss inputs, see the `PGPolicyGraph example `__. -ServingEnv also provides a ``self.log_action()`` call to support off-policy actions. This allows the client to make independent decisions, e.g., to compare two different policies, and for RLlib to still learn from those off-policy actions. Note that this requires the algorithm used to support learning from off-policy decisions (e.g., DQN). +Interfacing with External Agents +-------------------------------- + +In many situations, it does not make sense for an environment to be "stepped" by RLlib. For example, if a policy is to be used in a web serving system, then it is more natural for an agent to query a service that serves policy decisions, and for that service to learn from experience over time. This case also naturally arises with **external simulators** that run independently outside the control of RLlib, but may still want to leverage RLlib for training. + +RLlib provides the `ExternalEnv `__ class for this purpose. Unlike other envs, ExternalEnv has its own thread of control. At any point, agents on that thread can query the current policy for decisions via ``self.get_action()`` and reports rewards via ``self.log_returns()``. This can be done for multiple concurrent episodes as well. + +ExternalEnv can be used to implement a simple REST policy `server `__ that learns over time using RLlib. In this example RLlib runs with ``num_workers=0`` to avoid port allocation issues, but in principle this could be scaled by increasing ``num_workers``. + +Logging off-policy actions +~~~~~~~~~~~~~~~~~~~~~~~~~~ + +ExternalEnv also provides a ``self.log_action()`` call to support off-policy actions. This allows the client to make independent decisions, e.g., to compare two different policies, and for RLlib to still learn from those off-policy actions. Note that this requires the algorithm used to support learning from off-policy decisions (e.g., DQN). + +Data ingest +~~~~~~~~~~~ -The ``log_action`` API of ServingEnv can be used to ingest data from offline logs. The pattern would be as follows: First, some policy is followed to produce experience data which is stored in some offline storage system. Then, RLlib creates a number of workers that use a ServingEnv to read the logs in parallel and ingest the experiences. After a round of training completes, the new policy can be deployed to collect more experiences. +The ``log_action`` API of ExternalEnv can be used to ingest data from offline logs. The pattern would be as follows: First, some policy is followed to produce experience data which is stored in some offline storage system. 
Then, RLlib creates a number of workers that use a ExternalEnv to read the logs in parallel and ingest the experiences. After a round of training completes, the new policy can be deployed to collect more experiences. Note that envs can read from different partitions of the logs based on the ``worker_index`` attribute of the `env context `__ passed into the environment constructor. diff --git a/doc/source/rllib-envs.svg b/doc/source/rllib-envs.svg index 37d6d66e6e1e5..2cc45dbf96fa7 100644 --- a/doc/source/rllib-envs.svg +++ b/doc/source/rllib-envs.svg @@ -1 +1 @@ - \ No newline at end of file + \ No newline at end of file diff --git a/doc/source/rllib-models.rst b/doc/source/rllib-models.rst index a234ba0022420..9e7070b66c489 100644 --- a/doc/source/rllib-models.rst +++ b/doc/source/rllib-models.rst @@ -13,15 +13,24 @@ Built-in Models and Preprocessors RLlib picks default models based on a simple heuristic: a `vision network `__ for image observations, and a `fully connected network `__ for everything else. These models can be configured via the ``model`` config key, documented in the model `catalog `__. Note that you'll probably have to configure ``conv_filters`` if your environment observations have custom sizes, e.g., ``"model": {"dim": 42, "conv_filters": [[16, [4, 4], 2], [32, [4, 4], 2], [512, [11, 11], 1]]}`` for 42x42 observations. -In addition, if you set ``"model": {"use_lstm": true}``, then the model output will be further processed by a `LSTM cell `__. More generally, RLlib supports the use of recurrent models for its algorithms (A3C, PG out of the box), and RNN support is built into its policy evaluation utilities. +In addition, if you set ``"model": {"use_lstm": true}``, then the model output will be further processed by a `LSTM cell `__. More generally, RLlib supports the use of recurrent models for its policy gradient algorithms (A3C, PPO, PG, IMPALA), and RNN support is built into its policy evaluation utilities. -For preprocessors, RLlib tries to pick one of its built-in preprocessor based on the environment's observation space. Discrete observations are one-hot encoded, Atari observations downscaled, and Tuple observations flattened (there isn't native tuple support yet, but you can reshape the flattened observation in a custom model). Note that for Atari, RLlib defaults to using the `DeepMind preprocessors `__, which are also used by the OpenAI baselines library. +For preprocessors, RLlib tries to pick one of its built-in preprocessor based on the environment's observation space. Discrete observations are one-hot encoded, Atari observations downscaled, and Tuple and Dict observations flattened (these are unflattened and accessible via the ``input_dict`` parameter in custom models). Note that for Atari, RLlib defaults to using the `DeepMind preprocessors `__, which are also used by the OpenAI baselines library. +Built-in Model Parameters +~~~~~~~~~~~~~~~~~~~~~~~~~ + +The following is a list of the built-in model hyperparameters: + +.. literalinclude:: ../../python/ray/rllib/models/catalog.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ Custom Models ------------- -Custom models should subclass the common RLlib `model class `__ and override the ``_build_layers`` method. This method takes in a tensor input (observation), and returns a feature layer and float vector of the specified output size. 
The model can then be registered and used in place of a built-in model: +Custom models should subclass the common RLlib `model class `__ and override the ``_build_layers_v2`` method. This method takes in a dict of tensor inputs (the observation ``obs``, ``prev_action``, and ``prev_reward``, ``is_training``), and returns a feature layer and float vector of the specified output size. You can also override the ``value_function`` method to implement a custom value branch. A self-supervised loss can be defined via the ``loss`` method. The model can then be registered and used in place of a built-in model: .. code-block:: python @@ -30,12 +39,66 @@ Custom models should subclass the common RLlib `model class >> print(input_dict) + {'prev_actions': , + 'prev_rewards': , + 'is_training': , + 'obs': OrderedDict([ + ('sensors', OrderedDict([ + ('front_cam', [ + , + ]), + ('position', ), + ('velocity', )]))])} + """ + + layer1 = slim.fully_connected(input_dict["obs"], 64, ...) + layer2 = slim.fully_connected(layer1, 64, ...) ... return layerN, layerN_minus_1 + def value_function(self): + """Builds the value function output. + + This method can be overridden to customize the implementation of the + value function (e.g., not sharing hidden layers). + + Returns: + Tensor of size [BATCH_SIZE] for the value function. + """ + return tf.reshape( + linear(self.last_layer, 1, "value", normc_initializer(1.0)), [-1]) + + def loss(self): + """Builds any built-in (self-supervised) loss for the model. + + For example, this can be used to incorporate auto-encoder style losses. + Note that this loss has to be included in the policy graph loss to have + an effect (done for built-in algorithms). + + Returns: + Scalar tensor for the self-supervised loss. + """ + return tf.constant(0.0) + ModelCatalog.register_custom_model("my_model", MyModelClass) ray.init() @@ -46,12 +109,53 @@ Custom models should subclass the common RLlib `model class `__ and associated `training scripts `__. The ``CarlaModel`` class defined there operates over a composite (Tuple) observation space including both images and scalar measurements. +For a full example of a custom model in code, see the `Carla RLlib model `__ and associated `training scripts `__. You can also reference the `unit tests `__ for Tuple and Dict spaces, which show how to access nested observation fields. + +Custom Recurrent Models +~~~~~~~~~~~~~~~~~~~~~~~ + +Instead of using the ``use_lstm: True`` option, it can be preferable use a custom recurrent model. This provides more control over postprocessing of the LSTM output and can also allow the use of multiple LSTM cells to process different portions of the input. The only difference from a normal custom model is that you have to define ``self.state_init``, ``self.state_in``, and ``self.state_out``. You can refer to the existing `lstm.py `__ model as an example to implement your own model: + +.. code-block:: python + + class MyCustomLSTM(Model): + def _build_layers_v2(self, input_dict, num_outputs, options): + # Some initial layers to process inputs, shape [BATCH, OBS...]. + features = some_hidden_layers(input_dict["obs"]) + + # Add back the nested time dimension for tf.dynamic_rnn, new shape + # will be [BATCH, MAX_SEQ_LEN, OBS...]. + last_layer = add_time_dimension(features, self.seq_lens) + + # Setup the LSTM cell (see lstm.py for an example) + lstm = rnn.BasicLSTMCell(256, state_is_tuple=True) + self.state_init = ... + self.state_in = ... 
+ lstm_out, lstm_state = tf.nn.dynamic_rnn( + lstm, + last_layer, + initial_state=..., + sequence_length=self.seq_lens, + time_major=False, + dtype=tf.float32) + self.state_out = list(lstm_state) + + # Drop the time dimension again so back to shape [BATCH, OBS...]. + # Note that we retain the zero padding (see issue #2992). + last_layer = tf.reshape(lstm_out, [-1, cell_size]) + logits = linear(last_layer, num_outputs, "action", + normc_initializer(0.01)) + return logits, last_layer + +Batch Normalization +~~~~~~~~~~~~~~~~~~~ + +You can use ``tf.layers.batch_normalization(x, training=input_dict["is_training"])`` to add batch norm layers to your custom model: `code example `__. RLlib will automatically run the update ops for the batch norm layers during optimization (see `tf_policy_graph.py `__ and `multi_gpu_impl.py `__ for the exact handling of these updates). Custom Preprocessors -------------------- -Similarly, custom preprocessors should subclass the RLlib `preprocessor class `__ and be registered in the model catalog: +Similarly, custom preprocessors should subclass the RLlib `preprocessor class `__ and be registered in the model catalog. Note that you can alternatively use `gym wrapper classes `__ around your environment instead of preprocessors. .. code-block:: python @@ -60,8 +164,8 @@ Similarly, custom preprocessors should subclass the RLlib `preprocessor class `__ and `Horizon `__. The general idea is that the meaning of actions can be completely conditioned on the observation, i.e., the ``a`` in ``Q(s, a)`` becomes just a token in ``[0, MAX_AVAIL_ACTIONS)`` that only has meaning in the context of ``s``. This works with algorithms in the `DQN and policy-gradient families `__ and can be implemented as follows: + +1. The environment should return a mask and/or list of valid action embeddings as part of the observation for each step. To enable batching, the number of actions can be allowed to vary from 1 to some max number: + +.. code-block:: python + + class MyParamActionEnv(gym.Env): + def __init__(self, max_avail_actions): + self.action_space = Discrete(max_avail_actions) + self.observation_space = Dict({ + "action_mask": Box(0, 1, shape=(max_avail_actions, )), + "avail_actions": Box(-1, 1, shape=(max_avail_actions, action_embedding_sz)), + "real_obs": ..., + }) + +2. A custom model can be defined that can interpret the ``action_mask`` and ``avail_actions`` portions of the observation. Here the model computes the action logits via the dot product of some network output and each action embedding. Invalid actions can be masked out of the softmax by scaling the probability to zero: + +.. code-block:: python + + class MyParamActionModel(Model): + def _build_layers_v2(self, input_dict, num_outputs, options): + avail_actions = input_dict["obs"]["avail_actions"] + action_mask = input_dict["obs"]["action_mask"] + + output = FullyConnectedNetwork( + input_dict["obs"]["real_obs"], num_outputs=action_embedding_sz) + + # Expand the model output to [BATCH, 1, EMBED_SIZE]. Note that the + # avail actions tensor is of shape [BATCH, MAX_ACTIONS, EMBED_SIZE]. + intent_vector = tf.expand_dims(output, 1) + + # Shape of logits is [BATCH, MAX_ACTIONS]. 
+ action_logits = tf.reduce_sum(avail_actions * intent_vector, axis=2) + + # Mask out invalid actions (use tf.float32.min for stability) + inf_mask = tf.maximum(tf.log(action_mask), tf.float32.min) + masked_logits = inf_mask + action_logits + + return masked_logits, last_layer + + +Depending on your use case it may make sense to use just the masking, just action embeddings, or both. For a runnable example of this in code, check out `parametric_action_cartpole.py `__. Note that since masking introduces ``tf.float32.min`` values into the model output, this technique might not work with all algorithm options. For example, algorithms might crash if they incorrectly process the ``tf.float32.min`` values. The cartpole example has working configurations for DQN and several policy gradient algorithms. + Model-Based Rollouts -------------------- @@ -137,7 +288,8 @@ With a custom policy graph, you can also perform model-based rollouts and option def compute_actions(self, obs_batch, state_batches, - is_training=False, + prev_action_batch=None, + prev_reward_batch=None, episodes=None): # compute a batch of actions based on the current obs_batch # and state of each episode (i.e., for multiagent). You can do diff --git a/doc/source/rllib-training.rst b/doc/source/rllib-training.rst index 25cd0d8931850..dc350d272c99e 100644 --- a/doc/source/rllib-training.rst +++ b/doc/source/rllib-training.rst @@ -10,11 +10,11 @@ be trained, checkpointed, or an action computed. .. image:: rllib-api.svg -You can train a simple DQN agent with the following command +You can train a simple DQN agent with the following command: .. code-block:: bash - python ray/python/ray/rllib/train.py --run DQN --env CartPole-v0 + rllib train --run DQN --env CartPole-v0 By default, the results will be logged to a subdirectory of ``~/ray_results``. This subdirectory will contain a file ``params.json`` which contains the @@ -26,10 +26,12 @@ training process with TensorBoard by running tensorboard --logdir=~/ray_results -The ``train.py`` script has a number of options you can show by running +The ``rllib train`` command (same as the ``train.py`` script in the repo) has a number of options you can show by running: .. code-block:: bash + rllib train --help + -or- python ray/python/ray/rllib/train.py --help The most important options are for choosing the environment @@ -37,46 +39,57 @@ with ``--env`` (any OpenAI gym environment including ones registered by the user can be used) and for choosing the algorithm with ``--run`` (available options are ``PPO``, ``PG``, ``A2C``, ``A3C``, ``IMPALA``, ``ES``, ``DDPG``, ``DQN``, ``APEX``, and ``APEX_DDPG``). +Evaluating Trained Agents +~~~~~~~~~~~~~~~~~~~~~~~~~ + +In order to save checkpoints from which to evaluate agents, +set ``--checkpoint-freq`` (number of training iterations between checkpoints) +when running ``rllib train``. + + +An example of evaluating a previously trained DQN agent is as follows: + +.. code-block:: bash + + rllib rollout \ + ~/ray_results/default/DQN_CartPole-v0_0upjmdgr0/checkpoint_1/checkpoint-1 \ + --run DQN --env CartPole-v0 --steps 10000 + +The ``rollout.py`` helper script reconstructs a DQN agent from the checkpoint +located at ``~/ray_results/default/DQN_CartPole-v0_0upjmdgr0/checkpoint_1/checkpoint-1`` +and renders its behavior in the environment specified by ``--env``. 
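Putting the two commands together, a minimal train-then-evaluate workflow could look as follows (a sketch; the trial directory name under ``~/ray_results`` will differ on your machine):

.. code-block:: bash

    # Train, writing a checkpoint after every training iteration.
    rllib train --run DQN --env CartPole-v0 --checkpoint-freq 1

    # Replay the first saved checkpoint for 10000 steps.
    rllib rollout \
        ~/ray_results/default/DQN_CartPole-v0_0upjmdgr0/checkpoint_1/checkpoint-1 \
        --run DQN --env CartPole-v0 --steps 10000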
+ +Configuration +------------- + Specifying Parameters ~~~~~~~~~~~~~~~~~~~~~ Each algorithm has specific hyperparameters that can be set with ``--config``, in addition to a number of `common hyperparameters `__. See the `algorithms documentation `__ for more information. -In an example below, we train A2C by specifying 8 workers through the config flag. We also set ``"monitor": true`` to save episode videos to the result dir: +In an example below, we train A2C by specifying 8 workers through the config flag. .. code-block:: bash - python ray/python/ray/rllib/train.py --env=PongDeterministic-v4 \ - --run=A2C --config '{"num_workers": 8, "monitor": true}' - -.. image:: rllib-config.svg + rllib train --env=PongDeterministic-v4 --run=A2C --config '{"num_workers": 8}' Specifying Resources ~~~~~~~~~~~~~~~~~~~~ -You can control the degree of parallelism used by setting the ``num_workers`` hyperparameter for most agents. Many agents also provide a ``num_gpus`` or ``gpu`` option. In addition, you can allocate a fraction of a GPU by setting ``gpu_fraction: f``. For example, with DQN you can pack five agents onto one GPU by setting ``gpu_fraction: 0.2``. Note that fractional GPU support requires enabling the experimental Xray backend by setting the environment variable ``RAY_USE_XRAY=1``. ->>>>>>> 01b030bd57f014386aa5e4c67a2e069938528abb - -Evaluating Trained Agents -~~~~~~~~~~~~~~~~~~~~~~~~~ - -In order to save checkpoints from which to evaluate agents, -set ``--checkpoint-freq`` (number of training iterations between checkpoints) -when running ``train.py``. - +You can control the degree of parallelism used by setting the ``num_workers`` hyperparameter for most agents. The number of GPUs the driver should use can be set via the ``num_gpus`` option. Similarly, the resource allocation to workers can be controlled via ``num_cpus_per_worker``, ``num_gpus_per_worker``, and ``custom_resources_per_worker``. The number of GPUs can be a fractional quantity to allocate only a fraction of a GPU. For example, with DQN you can pack five agents onto one GPU by setting ``num_gpus: 0.2``. Note that in Ray < 0.6.0 fractional GPU support requires setting the environment variable ``RAY_USE_XRAY=1``. -An example of evaluating a previously trained DQN agent is as follows: +.. image:: rllib-config.svg -.. code-block:: bash +Common Parameters +~~~~~~~~~~~~~~~~~ - python ray/python/ray/rllib/rollout.py \ - ~/ray_results/default/DQN_CartPole-v0_0upjmdgr0/checkpoint-1 \ - --run DQN --env CartPole-v0 +The following is a list of the common agent hyperparameters: -The ``rollout.py`` helper script reconstructs a DQN agent from the checkpoint -located at ``~/ray_results/default/DQN_CartPole-v0_0upjmdgr0/checkpoint-1`` -and renders its behavior in the environment specified by ``--env``. +.. literalinclude:: ../../python/ray/rllib/agents/agent.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ Tuned Examples ~~~~~~~~~~~~~~ @@ -86,16 +99,16 @@ Some good hyperparameters and settings are available in (some of them are tuned to run on GPUs). If you find better settings or tune an algorithm on a different domain, consider submitting a Pull Request! -You can run these with the ``train.py`` script as follows: +You can run these with the ``rllib train`` command as follows: .. 
code-block:: bash - python ray/python/ray/rllib/train.py -f /path/to/tuned/example.yaml + rllib train -f /path/to/tuned/example.yaml Python API ---------- -The Python API provides the needed flexibility for applying RLlib to new problems. You will need to use this API if you wish to use custom environments, preprocesors, or models with RLlib. +The Python API provides the needed flexibility for applying RLlib to new problems. You will need to use this API if you wish to use `custom environments, preprocessors, or models `__ with RLlib. Here is an example of the basic usage: @@ -155,7 +168,7 @@ Tune will schedule the trials to run in parallel on your Ray cluster: == Status == Using FIFO scheduling algorithm. Resources requested: 4/4 CPUs, 0/0 GPUs - Result logdir: /home/eric/ray_results/my_experiment + Result logdir: ~/ray_results/my_experiment PENDING trials: - PPO_CartPole-v0_2_sgd_stepsize=0.0001: PENDING RUNNING trials: @@ -184,11 +197,194 @@ You can also access just the "master" copy of the agent state through ``agent.lo agent.optimizer.foreach_evaluator_with_index( lambda ev, i: ev.for_policy(lambda p: p.get_weights())) +Global Coordination +~~~~~~~~~~~~~~~~~~~ +Sometimes, it is necessary to coordinate between pieces of code that live in different processes managed by RLlib. For example, it can be useful to maintain a global average of a certain variable, or centrally control a hyperparameter used by policies. Ray provides a general way to achieve this through *named actors* (learn more about Ray actors `here `__). As an example, consider maintaining a shared global counter that is incremented by environments and read periodically from your driver program: + +.. code-block:: python + + from ray.experimental import named_actors + + @ray.remote + class Counter: + def __init__(self): + self.count = 0 + def inc(self, n): + self.count += n + def get(self): + return self.count + + # on the driver + counter = Counter.remote() + named_actors.register_actor("global_counter", counter) + print(ray.get(counter.get.remote())) # get the latest count + + # in your envs + counter = named_actors.get_actor("global_counter") + counter.inc.remote(1) # async call to increment the global count + +Ray actors provide high levels of performance, so in more complex cases they can be used implement communication patterns such as parameter servers and allreduce. + +Callbacks and Custom Metrics +~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +You can provide callback functions to be called at points during policy evaluation. These functions have access to an info dict containing state for the current `episode `__. Custom state can be stored for the `episode `__ in the ``info["episode"].user_data`` dict, and custom scalar metrics reported by saving values to the ``info["episode"].custom_metrics`` dict. These custom metrics will be aggregated and reported as part of training results. The following example (full code `here `__) logs a custom metric from the environment: + +.. 
code-block:: python + + def on_episode_start(info): + print(info.keys()) # -> "env", 'episode" + episode = info["episode"] + print("episode {} started".format(episode.episode_id)) + episode.user_data["pole_angles"] = [] + + def on_episode_step(info): + episode = info["episode"] + pole_angle = abs(episode.last_observation_for()[2]) + episode.user_data["pole_angles"].append(pole_angle) + + def on_episode_end(info): + episode = info["episode"] + pole_angle = np.mean(episode.user_data["pole_angles"]) + print("episode {} ended with length {} and pole angles {}".format( + episode.episode_id, episode.length, pole_angle)) + episode.custom_metrics["pole_angle"] = pole_angle + + def on_train_result(info): + print("agent.train() result: {} -> {} episodes".format( + info["agent"].__name__, info["result"]["episodes_this_iter"])) + + ray.init() + trials = tune.run_experiments({ + "test": { + "env": "CartPole-v0", + "run": "PG", + "config": { + "callbacks": { + "on_episode_start": tune.function(on_episode_start), + "on_episode_step": tune.function(on_episode_step), + "on_episode_end": tune.function(on_episode_end), + "on_train_result": tune.function(on_train_result), + }, + }, + } + }) + +Custom metrics can be accessed and visualized like any other training result: + +.. image:: custom_metric.png + +Example: Curriculum Learning +~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Let's look at two ways to use the above APIs to implement `curriculum learning `__. In curriculum learning, the agent task is adjusted over time to improve the learning process. Suppose that we have an environment class with a ``set_phase()`` method that we can call to adjust the task difficulty over time: + +Approach 1: Use the Agent API and update the environment between calls to ``train()``. This example shows the agent being run inside a Tune function: + +.. code-block:: python + + import ray + from ray import tune + from ray.rllib.agents.ppo import PPOAgent + + def train(config, reporter): + agent = PPOAgent(config=config, env=YourEnv) + while True: + result = agent.train() + reporter(**result) + if result["episode_reward_mean"] > 200: + phase = 2 + elif result["episode_reward_mean"] > 100: + phase = 1 + else: + phase = 0 + agent.optimizer.foreach_evaluator(lambda ev: ev.env.set_phase(phase)) + + ray.init() + tune.run_experiments({ + "curriculum": { + "run": train, + "config": { + "num_gpus": 0, + "num_workers": 2, + }, + "trial_resources": { + "cpu": 1, + "gpu": lambda spec: spec.config.num_gpus, + "extra_cpu": lambda spec: spec.config.num_workers, + }, + }, + }) + +Approach 2: Use the callbacks API to update the environment on new training results: + +.. code-block:: python + + import ray + from ray import tune + + def on_train_result(info): + result = info["result"] + if result["episode_reward_mean"] > 200: + phase = 2 + elif result["episode_reward_mean"] > 100: + phase = 1 + else: + phase = 0 + agent = info["agent"] + agent.optimizer.foreach_evaluator(lambda ev: ev.env.set_phase(phase)) + + ray.init() + tune.run_experiments({ + "curriculum": { + "run": "PPO", + "env": YourEnv, + "config": { + "callbacks": { + "on_train_result": tune.function(on_train_result), + }, + }, + }, + }) + +Debugging +--------- + +Gym Monitor +~~~~~~~~~~~ + +The ``"monitor": true`` config can be used to save Gym episode videos to the result dir. For example: + +.. 
code-block:: bash + + rllib train --env=PongDeterministic-v4 \ + --run=A2C --config '{"num_workers": 2, "monitor": true}' + + # videos will be saved in the ~/ray_results/ dir, for example + openaigym.video.0.31401.video000000.meta.json + openaigym.video.0.31401.video000000.mp4 + openaigym.video.0.31403.video000000.meta.json + openaigym.video.0.31403.video000000.mp4 + +Log Verbosity +~~~~~~~~~~~~~ + +You can control the agent log level via the ``"log_level"`` flag. Valid values are "INFO" (default), "DEBUG", "WARN", and "ERROR". This can be used to increase or decrease the verbosity of internal logging. For example: + +.. code-block:: bash + + rllib train --env=PongDeterministic-v4 \ + --run=A2C --config '{"num_workers": 2, "log_level": "DEBUG"}' + +Stack Traces +~~~~~~~~~~~~ + +You can use the ``ray stack`` command to dump the stack traces of all the Python workers on a single node. This can be useful for debugging unexpected hangs or performance issues. REST API -------- -In some cases (i.e., when interacting with an external environment) it makes more sense to interact with RLlib as if were an independently running service, rather than RLlib hosting the simulations itself. This is possible via RLlib's serving env `interface `__. +In some cases (i.e., when interacting with an externally hosted simulator or production environment) it makes more sense to interact with RLlib as if were an independently running service, rather than RLlib hosting the simulations itself. This is possible via RLlib's external agents `interface `__. .. autoclass:: ray.rllib.utils.policy_client.PolicyClient :members: diff --git a/doc/source/rllib.rst b/doc/source/rllib.rst index ea5bbbf583810..e96bd6fccbcb9 100644 --- a/doc/source/rllib.rst +++ b/doc/source/rllib.rst @@ -10,14 +10,14 @@ Learn more about RLlib's design by reading the `ICML paper `__ or `TensorFlow `__. Then, install the Ray RLlib module: +RLlib has extra dependencies on top of ``ray``. First, you'll need to install either `PyTorch `__ or `TensorFlow `__. Then, install the RLlib module: .. code-block:: bash pip install tensorflow # or tensorflow-gpu - pip install ray[rllib] + pip install ray[rllib] # also recommended: ray[debug] -You might also want to clone the Ray repo for convenient access to RLlib helper scripts: +You might also want to clone the `Ray repo `__ for convenient access to RLlib helper scripts: .. code-block:: bash @@ -27,7 +27,9 @@ You might also want to clone the Ray repo for convenient access to RLlib helper Training APIs ------------- * `Command-line `__ +* `Configuration `__ * `Python API `__ +* `Debugging `__ * `REST API `__ Environments @@ -36,8 +38,7 @@ Environments * `OpenAI Gym `__ * `Vectorized `__ * `Multi-Agent `__ -* `Agent-Driven `__ -* `Offline Data Ingest `__ +* `Interfacing with External Agents `__ * `Batch Asynchronous `__ Algorithms @@ -53,9 +54,9 @@ Algorithms - `Advantage Actor-Critic (A2C, A3C) `__ - - `Deep Deterministic Policy Gradients (DDPG) `__ + - `Deep Deterministic Policy Gradients (DDPG, TD3) `__ - - `Deep Q Networks (DQN, Rainbow) `__ + - `Deep Q Networks (DQN, Rainbow, Parametric DQN) `__ - `Policy Gradients `__ @@ -74,6 +75,7 @@ Models and Preprocessors * `Custom Models `__ * `Custom Preprocessors `__ * `Customizing Policy Graphs `__ +* `Variable-length / Parametric Action Spaces `__ * `Model-Based Rollouts `__ RLlib Concepts @@ -98,3 +100,6 @@ If you encounter errors like `blas_thread_init: pthread_create: Resource temporarily unavailable` when using many workers, try setting ``OMP_NUM_THREADS=1``. 
Similarly, check configured system limits with `ulimit -a` for other resource limit errors. + +For debugging unexpected hangs or performance problems, you can run ``ray stack`` to dump +the stack traces of all Ray workers on the current node. This requires py-spy to be installed. diff --git a/doc/source/security.rst b/doc/source/security.rst new file mode 100644 index 0000000000000..6b636c66858e2 --- /dev/null +++ b/doc/source/security.rst @@ -0,0 +1,55 @@ +Security +======== + +This document describes best security practices for using Ray. + +Intended Use and Threat Model +----------------------------- + +Ray instances should run on a secure network without public facing ports. +The most common threat for Ray instances is unauthorized access to Redis, +which can be exploited to gain shell access and run arbitrary code. +The best fix is to run Ray instances on a secure, trusted network. + +Running Ray on a secure network is not always feasible, so Ray +provides some basic security features: + + +Redis Port Authentication +------------------------- + +To prevent exploits via unauthorized Redis access, Ray provides the option to +password-protect Redis ports. While this is not a replacement for running Ray +behind a firewall, this feature is useful for instances exposed to the internet +where configuring a firewall is not possible. Because Redis is +very fast at serving queries, attackers can attempt passwords at a high rate, so the chosen password should be long. + +Redis authentication is only supported on the raylet code path. + +To add authentication via the Python API, start Ray using: + +.. code-block:: python + + ray.init(redis_password="password") + +To add authentication via the CLI, or connect to an existing Ray instance with +password-protected Redis ports: + +.. code-block:: bash + + ray start [--head] --redis-password="password" + +While Redis port authentication may protect against external attackers, +Ray does not encrypt traffic between nodes, so man-in-the-middle attacks are +possible for clusters on untrusted networks. + +Cloud Security +-------------- + +Launching Ray clusters on AWS or GCP using the ``ray up`` command +automatically configures security groups that prevent external Redis access. + +References +---------- + +- The `Redis security documentation ` diff --git a/doc/source/sgd.png b/doc/source/sgd.png new file mode 100644 index 0000000000000..aed38161cb159 Binary files /dev/null and b/doc/source/sgd.png differ diff --git a/doc/source/tempfile.rst b/doc/source/tempfile.rst new file mode 100644 index 0000000000000..d68e835e0261b --- /dev/null +++ b/doc/source/tempfile.rst @@ -0,0 +1,86 @@ +Temporary Files +=============== + +Ray produces a number of temporary files while it is running. +They are useful for logging, debugging, and sharing the object store with other programs. + +Location of Temporary Files +--------------------------- + +First, we introduce the concept of a Ray session. + +A session contains a set of processes. A session is created by running the +``ray start`` command or calling ``ray.init()`` in a Python script, and it ends when you +run ``ray stop`` or call ``ray.shutdown()``. + +For each session, Ray will create a *root temporary directory* to place all its +temporary files. The path is ``/tmp/ray/session_{datetime}_{pid}`` by default. +The pid is that of the startup process (the process calling ``ray.init()`` or +the Ray process executed by a shell in ``ray start``). +You can sort the session directories by name to find the latest one.
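As a concrete illustration, here is a small sketch (assuming the default ``/tmp/ray`` root and at least one session on the machine) of how the most recent session and its logs can be located programmatically:

.. code-block:: python

    import glob
    import os

    # Session directories are named session_{datetime}_{pid}, so sorting the
    # names lexicographically also sorts them chronologically.
    sessions = sorted(glob.glob("/tmp/ray/session_*"))
    latest = sessions[-1]

    print("Latest session:", latest)
    print("Log files:", os.listdir(os.path.join(latest, "logs")))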
+ +You can change the *root temporary directory* in one of these ways: + +* Pass ``--temp-dir={your temp path}`` to ``ray start`` +* Specify ``temp_dir`` when calling ``ray.init()`` + +You can also use ``default_worker.py --temp-dir={your temp path}`` to +start a new worker with the given *root temporary directory*. + +The *root temporary directory* you specify will be used as it is, +without a pid or datetime suffix attached. + +Layout of Temporary Files +------------------------- + +A typical layout of temporary files could look like this: + +.. code-block:: text + + /tmp + └── ray + └── session_{datetime}_{pid} + ├── logs # for logging + │   ├── log_monitor.err + │   ├── log_monitor.out + │   ├── monitor.err + │   ├── monitor.out + │   ├── plasma_store_0.err # array of plasma stores' outputs + │   ├── plasma_store_0.out + │   ├── raylet_0.err # array of raylets' outputs. Control it with `--no-redirect-worker-output` (in Ray's command line) or `redirect_worker_output` (in ray.init()) + │   ├── raylet_0.out + │   ├── redis-shard_0.err # array of redis shards' outputs + │   ├── redis-shard_0.out + │   ├── redis.err # redis + │   ├── redis.out + │   ├── webui.err # ipython notebook web ui + │   ├── webui.out + │   ├── worker-{worker_id}.err # redirected output of workers + │   ├── worker-{worker_id}.out + │   └── {other workers} + ├── ray_ui.ipynb # ipython notebook file + └── sockets # for sockets + ├── plasma_store + └── raylet # this could be deleted by Ray's shutdown cleanup. + + +Plasma Object Store Socket +-------------------------- + +Plasma object store sockets can be used to share objects with other programs using Apache Arrow. + +You can specify the plasma object store socket in one of these ways: + +* Pass ``--plasma-store-socket-name={your socket path}`` to ``ray start`` +* Specify ``plasma_store_socket_name`` when calling ``ray.init()`` + +The path you specify will be used as it is and will not be modified by Ray. + + +Notes +----- + +Temporary file policies are defined in ``python/ray/tempfile_services.py``. + +Currently, ``/tmp/ray`` is still used as the default directory for RLlib's temporary data files, as before. +This is not ideal and may change in a later release. diff --git a/doc/source/troubleshooting.rst b/doc/source/troubleshooting.rst index ff4b3039e8c15..86f56e7755957 100644 --- a/doc/source/troubleshooting.rst +++ b/doc/source/troubleshooting.rst @@ -61,10 +61,10 @@ of the following reasons. - **Stressful workloads:** Workloads that create many many tasks in a short amount of time can sometimes interfere with the heartbeat mechanism that we use to check that processes are still alive. On the head node in the cluster, - you can check the files ``/tmp/raylogs/monitor-******.out`` and - ``/tmp/raylogs/monitor-******.err``. They will indicate which processes Ray - has marked as dead (due to a lack of heartbeats). However, it is currently - possible for a process to get marked as dead without actually having died. + you can check the files ``/tmp/ray/session_*/logs/monitor*``. They will + indicate which processes Ray has marked as dead (due to a lack of heartbeats). + However, it is currently possible for a process to get marked as dead without + actually having died. - **Starting many actors:** Workloads that start a large number of actors all at once may exhibit problems when the processes (or libraries that they use) @@ -92,6 +92,11 @@ of the following reasons. Hanging ------- +..
tip:: + + You can run ``ray stack`` to dump the stack traces of all Ray workers on + the current node. This requires py-spy to be installed. + If a workload is hanging and not progressing, the problem may be one of the following. diff --git a/doc/source/tune-examples.rst b/doc/source/tune-examples.rst new file mode 100644 index 0000000000000..e0af86bcb6956 --- /dev/null +++ b/doc/source/tune-examples.rst @@ -0,0 +1,62 @@ +Tune Examples +============= + +.. Keep this in sync with ray/python/ray/tune/examples/README.rst + +In our repository, we provide a variety of examples for the various use cases and features of Tune. + +If any example is broken, or if you'd like to add an example to this page, feel free to raise an issue on our Github repository. + + +General Examples +---------------- + +- `async_hyperband_example `__: + Example of using a Trainable class with AsyncHyperBandScheduler. +- `hyperband_example `__: + Example of using a Trainable class with HyperBandScheduler. Also uses the Experiment class API for specifying the experiment configuration. +- `hyperopt_example `__: + Optimizes a basic function using the function-based API and the HyperOptSearch (SearchAlgorithm wrapper for HyperOpt TPE). + Also uses the AsyncHyperBandScheduler. +- `pbt_example `__: + Example of using a Trainable class with PopulationBasedTraining scheduler. +- `pbt_ppo_example `__: + Example of optimizing a distributed RLlib algorithm (PPO) with the PopulationBasedTraining scheduler. + + +Keras Examples +-------------- + +- `tune_mnist_keras `__: + Converts the Keras MNIST example to use Tune with the function-based API and a Keras callback. Also shows how to easily convert something relying on argparse to use Tune. + + +PyTorch Examples +---------------- + +- `mnist_pytorch `__: + Converts the PyTorch MNIST example to use Tune with the function-based API. Also shows how to easily convert something relying on argparse to use Tune. +- `mnist_pytorch_trainable `__: + Converts the PyTorch MNIST example to use Tune with Trainable API. Also uses the HyperBandScheduler and checkpoints the model at the end. + + +TensorFlow Examples +------------------- + +- `tune_mnist_ray `__: + A basic example of tuning a TensorFlow model on MNIST using the Trainable class. +- `tune_mnist_ray_hyperband `__: + A basic example of tuning a TensorFlow model on MNIST using the Trainable class and the HyperBand scheduler. +- `tune_mnist_async_hyperband `__: + Example of tuning a TensorFlow model on MNIST using AsyncHyperBand. + + +Contributed Examples +-------------------- + +- `pbt_tune_cifar10_with_keras `__: + A contributed example of tuning a Keras model on CIFAR10 with the PopulationBasedTraining scheduler. +- `genetic_example `__: + Optimizing the michalewicz function using the contributed GeneticSearch search algorithm with AsyncHyperBandScheduler. + + diff --git a/doc/source/tune-package-ref.rst b/doc/source/tune-package-ref.rst index d6f13cd981556..e7f3d3167adab 100644 --- a/doc/source/tune-package-ref.rst +++ b/doc/source/tune-package-ref.rst @@ -12,6 +12,11 @@ ray.tune :members: :private-members: + +.. autoclass:: ray.tune.function_runner.StatusReporter + :members: __call__ + + ray.tune.schedulers ------------------- @@ -24,7 +29,7 @@ ray.tune.suggest .. automodule:: ray.tune.suggest :members: - :exclude-members: function, grid_search, SuggestionAlgorithm + :exclude-members: function, sample_from, grid_search, SuggestionAlgorithm :show-inheritance: .. 
autoclass:: ray.tune.suggest.SuggestionAlgorithm diff --git a/doc/source/tune-searchalg.rst b/doc/source/tune-searchalg.rst index 97e8ce1bc295c..e8e5b0fa672ef 100644 --- a/doc/source/tune-searchalg.rst +++ b/doc/source/tune-searchalg.rst @@ -25,10 +25,13 @@ By default, Tune uses the `default search space and variant generation process < :noindex: +Note that other search algorithms will not necessarily extend this class and may require a different search space declaration than the default Tune format. + HyperOpt Search (Tree-structured Parzen Estimators) --------------------------------------------------- -The ``HyperOptSearch`` is a SearchAlgorithm that is backed by `HyperOpt `__ to perform sequential model-based hyperparameter optimization. +The ``HyperOptSearch`` is a SearchAlgorithm that is backed by `HyperOpt `__ to perform sequential model-based hyperparameter optimization. Note that this class does not extend ``ray.tune.suggest.BasicVariantGenerator``, so you will not be able to use Tune's default variant generation/search space declaration when using HyperOptSearch. + In order to use this search algorithm, you will need to install HyperOpt via the following command: .. code-block:: bash @@ -47,7 +50,6 @@ An example of this can be found in `hyperopt_example.py `__. - -More information about Tune's `trial schedulers can be found here `__. - +More information about Tune's `search algorithms can be found here `__. More information about Tune's `trial schedulers can be found here `__. Start by installing, importing, and initializing Ray. @@ -22,29 +19,48 @@ Start by installing, importing, and initializing Ray. ray.init() -Tune provides a ``run_experiments`` function that generates and runs the trials as described by the `experiment specification `__. -.. autofunction:: ray.tune.run_experiments - :noindex: +Experiment Configuration +------------------------ -This function will report status on the command line until all Trials stop: +This section will cover the main steps needed to modify your code to run Tune: using the `Training API `__ and `executing your Tune experiment `__. -:: +You can checkout out our `examples page `__ for more code examples. - == Status == - Using FIFO scheduling algorithm. - Resources used: 4/8 CPUs, 0/0 GPUs - Result logdir: ~/ray_results/my_experiment - - train_func_0_lr=0.2,momentum=1: RUNNING [pid=6778], 209 s, 20604 ts, 7.29 acc - - train_func_1_lr=0.4,momentum=1: RUNNING [pid=6780], 208 s, 20522 ts, 53.1 acc - - train_func_2_lr=0.6,momentum=1: TERMINATED [pid=6789], 21 s, 2190 ts, 100 acc - - train_func_3_lr=0.2,momentum=2: RUNNING [pid=6791], 208 s, 41004 ts, 8.37 acc - - train_func_4_lr=0.4,momentum=2: RUNNING [pid=6800], 209 s, 41204 ts, 70.1 acc - - train_func_5_lr=0.6,momentum=2: TERMINATED [pid=6809], 10 s, 2164 ts, 100 acc +Training API +~~~~~~~~~~~~ +Training can be done with either the **function-based API** or **Trainable API**. + +**Python functions** will need to have the following signature: + +.. code-block:: python + + def trainable(config, reporter): + """ + Args: + config (dict): Parameters provided from the search algorithm + or variant generation. + reporter (Reporter): Handle to report intermediate metrics to Tune. + """ + + while True: + # ... + reporter(**kwargs) + +The reporter will allow you to report metrics used for scheduling, search, or early stopping. + +Tune will run this function on a separate thread in a Ray actor process. 
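For instance, a minimal sketch of a function-based trainable might look like the following (the ``"alpha"`` hyperparameter and the update rule are made up purely for illustration):

.. code-block:: python

    import random

    from ray import tune

    def my_trainable(config, reporter):
        # "alpha" is a hypothetical hyperparameter passed in via the config dict.
        alpha = config.get("alpha", 0.1)
        loss = 1.0
        for step in range(100):
            loss -= alpha * random.random() * loss  # stand-in for a real training step
            # Report intermediate metrics; these can drive trial schedulers,
            # search algorithms, and stopping conditions.
            reporter(timesteps_this_iter=1, mean_loss=loss)

    tune.register_trainable("my_trainable", my_trainable)

An experiment can then refer to the registered name, e.g. ``"run": "my_trainable"``, in its specification as described below.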
Note that this API is not checkpointable, since the thread will never return control back to its caller. The reporter documentation can be `found here `__. + +.. note:: + If you have a lambda function that you want to train, you will need to first register the function: ``tune.register_trainable("lambda_id", lambda x: ...)``. You can then use ``lambda_id`` in place of ``my_trainable``. + +**Python classes** passed into Tune will need to subclass ``ray.tune.Trainable``. The Trainable interface `can be found here `__. + +Both the Trainable and function-based API will have `autofilled metrics `__ in addition to the metrics reported. + +See the `experiment specification `__ section on how to specify and execute your training. -Experiment Configuration ------------------------- Specifying Experiments ~~~~~~~~~~~~~~~~~~~~~~ @@ -79,54 +95,33 @@ dictionary. Tune will convert the dict into an ``ray.tune.Experiment`` object. "max_failures": 2 } } - run_experiments(experiment_spec) - - -An example of this can be found in `async_hyperband_example.py `__. - -Model API -~~~~~~~~~ - -You can either pass in a Python function or Python class for model training as follows, each requiring a specific signature/interface: - -.. code-block:: python - :emphasize-lines: 3,8 - - experiment_spec = { - "my_experiment_name": { - "run": my_trainable - } - } - # or with the Experiment API - experiment_spec = Experiment("my_experiment_name", my_trainable) +Tune provides a ``run_experiments`` function that generates and runs the trials. - run_experiments(experiments=experiment_spec) - - -**Python functions** will need to have the following signature: +.. autofunction:: ray.tune.run_experiments + :noindex: -.. code-block:: python +This function will report status on the command line until all Trials stop: - def trainable(config, reporter): - """ - Args: - config (dict): Parameters provided from the search algorithm - or variant generation. - reporter (Reporter): Handle to report intermediate metrics to Tune. - """ +:: -Tune will run this function on a separate thread in a Ray actor process. Note that trainable functions are not checkpointable, since they never return control back to their caller. See `Trial Checkpointing for more details `__. + == Status == + Using FIFO scheduling algorithm. + Resources used: 4/8 CPUs, 0/0 GPUs + Result logdir: ~/ray_results/my_experiment + - train_func_0_lr=0.2,momentum=1: RUNNING [pid=6778], 209 s, 20604 ts, 7.29 acc + - train_func_1_lr=0.4,momentum=1: RUNNING [pid=6780], 208 s, 20522 ts, 53.1 acc + - train_func_2_lr=0.6,momentum=1: TERMINATED [pid=6789], 21 s, 2190 ts, 100 acc + - train_func_3_lr=0.2,momentum=2: RUNNING [pid=6791], 208 s, 41004 ts, 8.37 acc + - train_func_4_lr=0.4,momentum=2: RUNNING [pid=6800], 209 s, 41204 ts, 70.1 acc + - train_func_5_lr=0.6,momentum=2: TERMINATED [pid=6809], 10 s, 2164 ts, 100 acc -.. note:: - If you have a lambda function that you want to train, you will need to first register the function: ``tune.register_trainable("lambda_id", lambda x: ...)``. You can then use ``lambda_id`` in place of ``my_trainable``. -**Python classes** passed into Tune will need to subclass ``ray.tune.Trainable``. +An example of this can be found in `async_hyperband_example.py `__. -.. 
autoclass:: ray.tune.Trainable - :members: __init__, _save, _restore, _train, _setup, _stop - :noindex: +Training Features +----------------- Tune Search Space (Default) ~~~~~~~~~~~~~~~~~~~~~~~~~~~ @@ -134,6 +129,9 @@ Tune Search Space (Default) You can use ``tune.grid_search`` to specify an axis of a grid search. By default, Tune also supports sampling parameters from user-specified lambda functions, which can be used independently or in combination with grid search. +.. note:: + If you specify an explicit Search Algorithm such as any SuggestionAlgorithm, you may not be able to specify lambdas or grid search with this interface, as the search algorithm may require a different search space declaration. + The following shows grid search over two nested parameters combined with random sampling from two lambda functions, generating 9 different trials. Note that the value of ``beta`` depends on the value of ``alpha``, which is represented by referencing ``spec.config.alpha`` in the lambda function. This lets you specify conditional parameter distributions. .. code-block:: python @@ -143,8 +141,8 @@ The following shows grid search over two nested parameters combined with random "my_experiment_name": { "run": my_trainable, "config": { - "alpha": lambda spec: np.random.uniform(100), - "beta": lambda spec: spec.config.alpha * np.random.normal(), + "alpha": tune.sample_from(lambda spec: np.random.uniform(100)), + "beta": tune.sample_from(lambda spec: spec.config.alpha * np.random.normal()), "nn_layers": [ tune.grid_search([16, 64, 256]), tune.grid_search([16, 64, 256]), @@ -155,10 +153,7 @@ The following shows grid search over two nested parameters combined with random .. note:: - Lambda functions will be evaluated during trial variant generation. If you need to pass a literal function in your config, use ``tune.function(...)`` to escape it. - -.. warning:: - If you specify a Search Algorithm, you may not be able to use this feature, as the algorithm may require a different search space declaration. + Use ``tune.sample_from(...)`` to sample from a function during trial variant generation. If you need to pass a literal function in your config, use ``tune.function(...)`` to escape it. For more information on variant generation, see `basic_variant.py `__. @@ -174,8 +169,8 @@ By default, each random variable and grid search point is sampled once. To take "my_experiment_name": { "run": my_trainable, "config": { - "alpha": lambda spec: np.random.uniform(100), - "beta": lambda spec: spec.config.alpha * np.random.normal(), + "alpha": tune.sample_from(lambda spec: np.random.uniform(100)), + "beta": tune.sample_from(lambda spec: spec.config.alpha * np.random.normal()), "nn_layers": [ tune.grid_search([16, 64, 256]), tune.grid_search([16, 64, 256]), @@ -193,9 +188,12 @@ Using GPUs (Resource Allocation) Tune will allocate the specified GPU and CPU ``trial_resources`` to each individual trial (defaulting to 1 CPU per trial). Under the hood, Tune runs each trial as a Ray actor, using Ray's resource handling to allocate resources and place actors. A trial will not be scheduled unless at least that amount of resources is available in the cluster, preventing the cluster from being overloaded. +Fractional values are also supported, (i.e., ``"gpu": 0.2``). You can find an example of this in the `Keras MNIST example `__. + If GPU resources are not requested, the ``CUDA_VISIBLE_DEVICES`` environment variable will be set as empty, disallowing GPU access. 
Otherwise, it will be set to the GPUs in the list (this is managed by Ray). + If your trainable function / class creates further Ray actors or tasks that also consume CPU / GPU resources, you will also want to set ``extra_cpu`` or ``extra_gpu`` to reserve extra resource slots for the actors you will create. For example, if a trainable class requires 1 GPU itself, but will launch 4 actors each using another GPU, then it should set ``"gpu": 1, "extra_gpu": 4``. .. code-block:: python @@ -216,14 +214,14 @@ If your trainable function / class creates further Ray actors or tasks that also Trial Checkpointing ~~~~~~~~~~~~~~~~~~~ -To enable checkpointing, you must implement a `Trainable class `__ (Trainable functions are not checkpointable, since they never return control back to their caller). The easiest way to do this is to subclass the pre-defined ``Trainable`` class and implement its ``_train``, ``_save``, and ``_restore`` abstract methods `(example) `__. Implementing this interface is required to support resource multiplexing in Trial Schedulers such as HyperBand and PBT. +To enable checkpointing, you must implement a `Trainable class `__ (Trainable functions are not checkpointable, since they never return control back to their caller). The easiest way to do this is to subclass the pre-defined ``Trainable`` class and implement its ``_train``, ``_save``, and ``_restore`` abstract methods `(example) `__. Implementing this interface is required to support resource multiplexing in Trial Schedulers such as HyperBand and PBT. For TensorFlow model training, this would look something like this `(full tensorflow example) `__: .. code-block:: python class MyClass(Trainable): - def _setup(self): + def _setup(self, config): self.saver = tf.train.Saver() self.sess = ... self.iteration = 0 @@ -297,6 +295,28 @@ You often will want to compute a large object (e.g., training data, model weight } }) +Auto-Filled Results +------------------- + +During training, Tune will automatically fill certain fields if not already provided. All of these can be used as stopping conditions or in the Scheduler/Search Algorithm specification. + +.. literalinclude:: ../../python/ray/tune/result.py + :language: python + :start-after: __sphinx_doc_begin__ + :end-before: __sphinx_doc_end__ + +The following fields will automatically show up on the console output, if provided: + +1. ``episode_reward_mean`` +2. ``mean_loss`` +3. ``mean_accuracy`` +4. ``timesteps_this_iter`` (aggregated into ``timesteps_total``). + +.. code-block:: bash + + Example_0: TERMINATED [pid=68248], 179 s, 2 iter, 60000 ts, 94 rew + + Logging and Visualizing Results ------------------------------- @@ -360,12 +380,6 @@ Then, on the client side, you can use the following class. The server address de For an example notebook for using the Client API, see the `Client API Example `__. -Examples --------- - -You can find a comprehensive of examples `using Tune and its various features here `__, including examples using Keras, TensorFlow, and Population-Based Training. - - Further Questions or Issues? ---------------------------- diff --git a/doc/source/tune.rst b/doc/source/tune.rst index a849f3b811d58..14c95fb0edcb0 100644 --- a/doc/source/tune.rst +++ b/doc/source/tune.rst @@ -7,7 +7,10 @@ Tune: Scalable Hyperparameter Search Tune is a scalable framework for hyperparameter search with a focus on deep learning and deep reinforcement learning. -You can find the code for Tune `here on GitHub `__. +You can find the code for Tune `here on GitHub `__. 
To get started with Tune, try going through `our tutorial of using Tune with Keras `__. + +(Experimental): You can try out `the above tutorial on a free hosted server via Binder `__. + Features -------- @@ -42,7 +45,7 @@ You'll need to first `install ray `__ to import Tune. .. code-block:: bash - pip install ray + pip install ray # also recommended: ray[debug] Quick Start diff --git a/doc/source/tutorial.rst b/doc/source/tutorial.rst index 0493b69169909..81de87a571ced 100644 --- a/doc/source/tutorial.rst +++ b/doc/source/tutorial.rst @@ -9,7 +9,7 @@ To use Ray, you need to understand the following: Overview -------- -Ray is a Python-based distributed execution engine. The same code can be run on +Ray is a distributed execution engine. The same code can be run on a single machine to achieve efficient multiprocessing, and it can be used on a cluster for large computations. @@ -21,8 +21,6 @@ When using Ray, several processes are involved. allows workers to efficiently share objects on the same node with minimal copying and deserialization. - One **local scheduler** per node assigns tasks to workers on the same node. -- A **global scheduler** receives tasks from local schedulers and assigns them - to other local schedulers. - A **driver** is the Python process that the user controls. For example, if the user is running a script or using a Python shell, then the driver is the Python process that runs the script or the shell. A driver is similar to a worker in diff --git a/doc/source/user-profiling.rst b/doc/source/user-profiling.rst index e7c18dd5ee737..cdbabff391884 100644 --- a/doc/source/user-profiling.rst +++ b/doc/source/user-profiling.rst @@ -1,11 +1,11 @@ Profiling for Ray Users ======================= -This document is intended for users of Ray who want to know how to evaluate -the performance of their code while running on Ray. Profiling the -performance of your code can be very helpful to determine performance -bottlenecks or to find out where your code may not be parallelized properly. -If you are interested in pinpointing why your Ray application may not be +This document is intended for users of Ray who want to know how to evaluate +the performance of their code while running on Ray. Profiling the +performance of your code can be very helpful to determine performance +bottlenecks or to find out where your code may not be parallelized properly. +If you are interested in pinpointing why your Ray application may not be achieving the expected speedup, read on! @@ -28,26 +28,26 @@ let's define our remote function to just sleep for 0.5 seconds: def func(): time.sleep(0.5) -In our example setup, we wish to call our remote function ``func()`` five -times, and store the result of each call into a list. To compare the -performance of different ways of looping our calls to our remote function, +In our example setup, we wish to call our remote function ``func()`` five +times, and store the result of each call into a list. To compare the +performance of different ways of looping our calls to our remote function, we can define each loop version as a separate function on the driver script. -For the first version **ex1**, each iteration of the loop calls the remote -function, then calls ``ray.get`` in an attempt to store the current result +For the first version **ex1**, each iteration of the loop calls the remote +function, then calls ``ray.get`` in an attempt to store the current result into the list, as follows: .. 
code-block:: python # This loop is suboptimal in Ray, and should only be used for the sake of this example - def ex1(): + def ex1(): list1 = [] for i in range(5): list1.append(ray.get(func.remote())) -For the second version **ex2**, each iteration of the loop calls the remote -function, and stores it into the list **without** calling ``ray.get`` each time. -``ray.get`` is used after the loop has finished, in preparation for processing +For the second version **ex2**, each iteration of the loop calls the remote +function, and stores it into the list **without** calling ``ray.get`` each time. +``ray.get`` is used after the loop has finished, in preparation for processing ``func()``'s results: .. code-block:: python @@ -59,8 +59,8 @@ function, and stores it into the list **without** calling ``ray.get`` each time. list2.append(func.remote()) ray.get(list2) -Finally, for an example that's not so parallelizable, let's create a -third version **ex3** where the driver has to call a local +Finally, for an example that's not so parallelizable, let's create a +third version **ex3** where the driver has to call a local function in between each call to the remote function ``func()``: .. code-block:: python @@ -81,14 +81,14 @@ Timing Performance Using Python's Timestamps -------------------------------------------- One way to sanity-check the performance of the three loops is simply to -time how long it takes to complete each loop version. We can do this using +time how long it takes to complete each loop version. We can do this using python's built-in ``time`` `module`_. .. _`module`: https://docs.python.org/3/library/time.html -The ``time`` module contains a useful ``time()`` function that returns the -current timestamp in unix time whenever it's called. We can create a generic -function wrapper to call ``time()`` right before and right after each loop +The ``time`` module contains a useful ``time()`` function that returns the +current timestamp in unix time whenever it's called. We can create a generic +function wrapper to call ``time()`` right before and right after each loop function to print out how long each loop takes overall: .. code-block:: python @@ -106,8 +106,8 @@ function to print out how long each loop takes overall: return result return timed_wrapper -To always print out how long the loop takes to run each time the loop -function ``ex1()`` is called, we can evoke our ``time_this`` wrapper with +To always print out how long the loop takes to run each time the loop +function ``ex1()`` is called, we can evoke our ``time_this`` wrapper with a function decorator. This can similarly be done to functions ``ex2()`` and ``ex3()``: @@ -136,9 +136,9 @@ Then, running the three timed loops should yield output similar to this: | func:'ex2' args:[(), {}] took: 1.0032 seconds | | func:'ex3' args:[(), {}] took: 2.0039 seconds | -Let's interpret these results. +Let's interpret these results. -Here, ``ex1()`` took substantially more time than ``ex2()``, where +Here, ``ex1()`` took substantially more time than ``ex2()``, where their only difference is that ``ex1()`` calls ``ray.get`` on the remote function before adding it to the list, while ``ex2()`` waits to fetch the entire list with ``ray.get`` at once. @@ -160,28 +160,28 @@ entire list with ``ray.get`` at once. list2.append(func.remote()) ray.get(list2) -Notice how ``ex1()`` took 2.5 seconds, exactly five times 0.5 seconds, or -the time it would take to wait for our remote function five times in a row. 
+Notice how ``ex1()`` took 2.5 seconds, exactly five times 0.5 seconds, or +the time it would take to wait for our remote function five times in a row. -By calling ``ray.get`` after each call to the remote function, ``ex1()`` -removes all ability to parallelize work, by forcing the driver to wait for -each ``func()``'s result in succession. We are not taking advantage of Ray -parallelization here! +By calling ``ray.get`` after each call to the remote function, ``ex1()`` +removes all ability to parallelize work, by forcing the driver to wait for +each ``func()``'s result in succession. We are not taking advantage of Ray +parallelization here! -Meanwhile, ``ex2()`` takes about 1 second, much faster than it would normally -take to call ``func()`` five times iteratively. Ray is running each call to -``func()`` in parallel, saving us time. +Meanwhile, ``ex2()`` takes about 1 second, much faster than it would normally +take to call ``func()`` five times iteratively. Ray is running each call to +``func()`` in parallel, saving us time. -``ex1()`` is actually a common user mistake in Ray. ``ray.get`` is not -necessary to do before adding the result of ``func()`` to the list. Instead, -the driver should send out all parallelizable calls to the remote function +``ex1()`` is actually a common user mistake in Ray. ``ray.get`` is not +necessary to do before adding the result of ``func()`` to the list. Instead, +the driver should send out all parallelizable calls to the remote function to Ray before waiting to receive their results with ``ray.get``. ``ex1()``'s suboptimal behavior can be noticed just using this simple timing test. -Realistically, however, many applications are not as highly parallelizable -as ``ex2()``, and the application includes sections where the code must run in +Realistically, however, many applications are not as highly parallelizable +as ``ex2()``, and the application includes sections where the code must run in serial. ``ex3()`` is such an example, where the local function ``other_func()`` -must run first before each call to ``func()`` can be submitted to Ray. +must run first before each call to ``func()`` can be submitted to Ray. .. code-block:: python @@ -196,23 +196,23 @@ must run first before each call to ``func()`` can be submitted to Ray. list2.append(func.remote()) ray.get(list3) -What results is that while ``ex3()`` still gained 0.5 seconds of speedup +What results is that while ``ex3()`` still gained 0.5 seconds of speedup compared to the completely serialized ``ex1()`` version, this speedup is -still nowhere near the ideal speedup of ``ex2()``. +still nowhere near the ideal speedup of ``ex2()``. -The dramatic speedup of ``ex2()`` is possible because ``ex2()`` is -theoretically completely parallelizable: if we were given 5 CPUs, all 5 calls -to ``func()`` can be run in parallel. What is happening with ``ex3()``, -however, is that each parallelized call to ``func()`` is staggered by a wait +The dramatic speedup of ``ex2()`` is possible because ``ex2()`` is +theoretically completely parallelizable: if we were given 5 CPUs, all 5 calls +to ``func()`` can be run in parallel. What is happening with ``ex3()``, +however, is that each parallelized call to ``func()`` is staggered by a wait of 0.3 seconds for the local ``other_func()`` to finish. -``ex3()`` is thus a manifestation of `Amdahls Law`_: the fastest theoretically -possible execution time from parallelizing an application is limited to be -no better than the time it takes to run all serial parts in serial. 
+``ex3()`` is thus a manifestation of `Amdahls Law`_: the fastest theoretically +possible execution time from parallelizing an application is limited to be +no better than the time it takes to run all serial parts in serial. .. _`Amdahls Law`: https://en.wikipedia.org/wiki/Amdahl%27s_law -Due to Amdahl's Law, ``ex3()`` must take at least 1.5 +Due to Amdahl's Law, ``ex3()`` must take at least 1.5 seconds -- the time it takes for 5 serial calls to ``other_func()`` to finish! After an additional 0.5 seconds to execute func and get the result, the computation is done. @@ -224,7 +224,7 @@ Profiling Using An External Profiler (Line Profiler) One way to profile the performance of our code using Ray is to use a third-party profiler such as `Line_profiler`_. Line_profiler is a useful line-by-line profiler for pure Python applications that formats its output side-by-side with -the profiled code itself. +the profiled code itself. Alternatively, another third-party profiler (not covered in this documentation) that you could use is `Pyflame`_, which can generate profiling graphs. @@ -238,11 +238,11 @@ First install ``line_profiler`` with pip: pip install line_profiler -``line_profiler`` requires each section of driver code that you want to profile as -its own independent function. Conveniently, we have already done so by defining +``line_profiler`` requires each section of driver code that you want to profile as +its own independent function. Conveniently, we have already done so by defining each loop version as its own function. To tell ``line_profiler`` which functions -to profile, just add the ``@profile`` decorator to ``ex1()``, ``ex2()`` and -``ex3()``. Note that you do not need to import ``line_profiler`` into your Ray +to profile, just add the ``@profile`` decorator to ``ex1()``, ``ex2()`` and +``ex3()``. Note that you do not need to import ``line_profiler`` into your Ray application: .. code-block:: python @@ -262,16 +262,16 @@ application: if __name__ == "__main__": main() -Then, when we want to execute our Python script from the command line, instead -of ``python your_script_here.py``, we use the following shell command to run the +Then, when we want to execute our Python script from the command line, instead +of ``python your_script_here.py``, we use the following shell command to run the script with ``line_profiler`` enabled: .. code-block:: bash - kernprof -l your_script_here.py + kernprof -l your_script_here.py -This command runs your script and prints only your script's output as usual. -``Line_profiler`` instead outputs its profiling results to a corresponding +This command runs your script and prints only your script's output as usual. +``Line_profiler`` instead outputs its profiling results to a corresponding binary file called ``your_script_here.py.lprof``. To read ``line_profiler``'s results to terminal, use this shell command: @@ -300,10 +300,10 @@ Note that execution time is given in units of 1e-06 seconds: 33 5 2508805.0 501761.0 100.0 list1.append(ray.get(func.remote())) -Notice that each hit to ``list1.append(ray.get(func.remote()))`` at line 33 -takes the full 0.5 seconds waiting for ``func()`` to finish. Meanwhile, in -``ex2()`` below, each call of ``func.remote()`` at line 40 only takes 0.127 ms, -and the majority of the time (about 1 second) is spent on waiting for ``ray.get()`` +Notice that each hit to ``list1.append(ray.get(func.remote()))`` at line 33 +takes the full 0.5 seconds waiting for ``func()`` to finish. 
Meanwhile, in +``ex2()`` below, each call of ``func.remote()`` at line 40 only takes 0.127 ms, +and the majority of the time (about 1 second) is spent on waiting for ``ray.get()`` at the end: @@ -323,11 +323,11 @@ at the end: 41 1 1002919.0 1002919.0 99.9 ray.get(list2) -And finally, ``line_profiler``'s output for ``ex3()``. Each call to -``func.remote()`` at line 50 still take magnitudes faster than 0.5 seconds, -showing that Ray is successfully parallelizing the remote calls. However, each -call to the local function ``other_func()`` takes the full 0.3 seconds, -totalling up to the guaranteed minimum application execution time of 1.5 +And finally, ``line_profiler``'s output for ``ex3()``. Each call to +``func.remote()`` at line 50 still take magnitudes faster than 0.5 seconds, +showing that Ray is successfully parallelizing the remote calls. However, each +call to the local function ``other_func()`` takes the full 0.3 seconds, +totalling up to the guaranteed minimum application execution time of 1.5 seconds: .. code-block:: bash @@ -351,20 +351,20 @@ seconds: Profiling Using Python's CProfile --------------------------------- -A second way to profile the performance of your Ray application is to -use Python's native cProfile `profiling module`_. Rather than tracking +A second way to profile the performance of your Ray application is to +use Python's native cProfile `profiling module`_. Rather than tracking line-by-line of your application code, cProfile can give the total runtime of each loop function, as well as list the number of calls made and -execution time of all function calls made within the profiled code. +execution time of all function calls made within the profiled code. .. _`profiling module`: https://docs.python.org/3/library/profile.html#module-cProfile -Unlike ``line_profiler`` above, this detailed list of profiled function calls -**includes** internal function calls and function calls made within Ray! +Unlike ``line_profiler`` above, this detailed list of profiled function calls +**includes** internal function calls and function calls made within Ray! -However, similar to ``line_profiler``, cProfile can be enabled with minimal -changes to your application code (given that each section of the code you want -to profile is defined as its own function). To use cProfile, add an import +However, similar to ``line_profiler``, cProfile can be enabled with minimal +changes to your application code (given that each section of the code you want +to profile is defined as its own function). To use cProfile, add an import statement, then replace calls to the loop functions as follows: .. code-block:: python @@ -385,17 +385,17 @@ statement, then replace calls to the loop functions as follows: if __name__ == "__main__": main() -Now, when executing your Python script, a cProfile list of profiled function +Now, when executing your Python script, a cProfile list of profiled function calls will be outputted to terminal for each call made to ``cProfile.run()``. -At the very top of cProfile's output gives the total execution time for +At the very top of cProfile's output gives the total execution time for ``'ex1()'``: .. code-block:: bash 601 function calls (595 primitive calls) in 2.509 seconds -Following is a snippet of profiled function calls for ``'ex1()'``. Most of -these calls are quick and take around 0.000 seconds, so the functions of +Following is a snippet of profiled function calls for ``'ex1()'``. 
Most of +these calls are quick and take around 0.000 seconds, so the functions of interest are the ones with non-zero execution times: .. code-block:: bash @@ -405,7 +405,7 @@ interest are the ones with non-zero execution times: 1 0.000 0.000 2.509 2.509 your_script_here.py:31(ex1) 5 0.000 0.000 0.001 0.000 remote_function.py:103(remote) 5 0.000 0.000 0.001 0.000 remote_function.py:107(_submit) - ... + ... 10 0.000 0.000 0.000 0.000 worker.py:2459(__init__) 5 0.000 0.000 2.508 0.502 worker.py:2535(get) 5 0.000 0.000 0.000 0.000 worker.py:2695(get_global_worker) @@ -414,25 +414,25 @@ interest are the ones with non-zero execution times: 5 0.000 0.000 0.000 0.000 worker.py:514(submit_task) ... -The 5 separate calls to Ray's ``get``, taking the full 0.502 seconds each call, -can be noticed at ``worker.py:2535(get)``. Meanwhile, the act of calling the -remote function itself at ``remote_function.py:103(remote)`` only takes 0.001 -seconds over 5 calls, and thus is not the source of the slow performance of +The 5 separate calls to Ray's ``get``, taking the full 0.502 seconds each call, +can be noticed at ``worker.py:2535(get)``. Meanwhile, the act of calling the +remote function itself at ``remote_function.py:103(remote)`` only takes 0.001 +seconds over 5 calls, and thus is not the source of the slow performance of ``ex1()``. Profiling Ray Actors with cProfile ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -Considering that the detailed output of cProfile can be quite different depending -on what Ray functionalities we use, let us see what cProfile's output might look -like if our example involved Actors (for an introduction to Ray actors, see our -`Actor documentation here`_). +Considering that the detailed output of cProfile can be quite different depending +on what Ray functionalities we use, let us see what cProfile's output might look +like if our example involved Actors (for an introduction to Ray actors, see our +`Actor documentation here`_). .. _`Actor documentation here`: http://ray.readthedocs.io/en/latest/actors.html Now, instead of looping over five calls to a remote function like in ``ex1``, -let's create a new example and loop over five calls to a remote function +let's create a new example and loop over five calls to a remote function **inside an actor**. Our actor's remote function again just sleeps for 0.5 seconds: @@ -440,7 +440,7 @@ seconds: # Our actor @ray.remote - class Sleeper(object): + class Sleeper(object): def __init__(self): self.sleepValue = 0.5 @@ -448,7 +448,7 @@ seconds: def actor_func(self): time.sleep(self.sleepValue) -Recalling the suboptimality of ``ex1``, let's first see what happens if we +Recalling the suboptimality of ``ex1``, let's first see what happens if we attempt to perform all five ``actor_func()`` calls within a single actor: .. code-block:: python @@ -470,7 +470,7 @@ We enable cProfile on this example as follows: def main(): ray.init() - cProfile.run('ex4()') + cProfile.run('ex4()') if __name__ == "__main__": main() @@ -497,22 +497,22 @@ Running our new Actor example, cProfile's abbreviated output is as follows: 8 0.000 0.000 0.001 0.000 worker.py:514(submit_task) ... -It turns out that the entire example still took 2.5 seconds to execute, or the -time for five calls to ``actor_func()`` to run in serial. We remember in ``ex1`` -that this behavior was because we did not wait until after submitting all five +It turns out that the entire example still took 2.5 seconds to execute, or the +time for five calls to ``actor_func()`` to run in serial. 
We remember in ``ex1`` +that this behavior was because we did not wait until after submitting all five remote function tasks to call ``ray.get()``, but we can verify on cProfile's -output line ``worker.py:2535(get)`` that ``ray.get()`` was only called once at -the end, for 2.509 seconds. What happened? +output line ``worker.py:2535(get)`` that ``ray.get()`` was only called once at +the end, for 2.509 seconds. What happened? -It turns out Ray cannot parallelize this example, because we have only -initialized a single ``Sleeper`` actor. Because each actor is a single, -stateful worker, our entire code is submitted and ran on a single worker the +It turns out Ray cannot parallelize this example, because we have only +initialized a single ``Sleeper`` actor. Because each actor is a single, +stateful worker, our entire code is submitted and ran on a single worker the whole time. To better parallelize the actors in ``ex4``, we can take advantage that each call to ``actor_func()`` is independent, and instead create five ``Sleeper`` actors. That way, we are creating five workers -that can run in parallel, instead of creating a single worker that +that can run in parallel, instead of creating a single worker that can only handle one call to ``actor_func()`` at a time. .. code-block:: python @@ -530,7 +530,7 @@ can only handle one call to ``actor_func()`` at a time. Our example in total now takes only 1.5 seconds to run: -.. code-block:: bash +.. code-block:: bash 1378 function calls (1363 primitive calls) in 1.567 seconds @@ -553,27 +553,27 @@ Our example in total now takes only 1.5 seconds to run: Visualizing Tasks in the Ray Timeline ------------------------------------- -Profiling the performance of your Ray application doesn't need to be -an eye-straining endeavor of interpreting numbers among hundreds of -lines of text. Ray comes with its own visual web UI to visualize the +Profiling the performance of your Ray application doesn't need to be +an eye-straining endeavor of interpreting numbers among hundreds of +lines of text. Ray comes with its own visual web UI to visualize the parallelization (or lack thereof) of user tasks submitted to Ray! -This method does have its own limitations, however. The Ray Timeline +This method does have its own limitations, however. The Ray Timeline can only show timing info about Ray tasks, and not timing for normal Python functions. This can be an issue especially for debugging slow -Python code that is running on the driver, and not running as a task on -one of the workers. The other profiling techniques above are options that +Python code that is running on the driver, and not running as a task on +one of the workers. The other profiling techniques above are options that do cover profiling normal Python functions. Currently, whenever initializing Ray, a URL is generated and printed -in the terminal. This URL can be used to view Ray's web UI as a Jupyter +in the terminal. This URL can be used to view Ray's web UI as a Jupyter notebook: .. code-block:: bash ~$: python your_script_here.py - Process STDOUT and STDERR is being redirected to /tmp/raylogs/. + Process STDOUT and STDERR is being redirected to /tmp/ray/session_2018-11-01_14-31-43_27211/logs. Waiting for redis server at 127.0.0.1:61150 to respond... Waiting for redis server at 127.0.0.1:21607 to respond... Starting local scheduler with the following resources: {'CPU': 4, 'GPU': 0}. 
@@ -582,13 +582,13 @@ notebook: View the web UI at http://localhost:8897/notebooks/ray_ui84907.ipynb?token=025e8ab295270a57fac209204b37349fdf34e037671a13ff ====================================================================== -Ray's web UI attempts to run on localhost at port 8888, and if it fails -it tries successive ports until it finds an open port. In this above +Ray's web UI attempts to run on localhost at port 8888, and if it fails +it tries successive ports until it finds an open port. In this above example, it has opened on port 8897. -Because this web UI is only available as long as your Ray application -is currently running, you may need to add a user prompt to prevent -your Ray application from exiting once it has finished executing, +Because this web UI is only available as long as your Ray application +is currently running, you may need to add a user prompt to prevent +your Ray application from exiting once it has finished executing, such as below. You can then browse the web UI for as long as you like: .. code-block:: python @@ -606,44 +606,44 @@ such as below. You can then browse the web UI for as long as you like: main() Now, when executing your python script, you can access the Ray timeline -by copying the web UI URL into your web browser on the Ray machine. To -load the web UI in the jupyter notebook, select **Kernel -> Restart and +by copying the web UI URL into your web browser on the Ray machine. To +load the web UI in the jupyter notebook, select **Kernel -> Restart and Run All** in the jupyter menu. -The Ray timeline can be viewed in the fourth cell of the UI notebook by -using the task filter options, then clicking on the **View task timeline** +The Ray timeline can be viewed in the fourth cell of the UI notebook by +using the task filter options, then clicking on the **View task timeline** button. -For example, here are the results of executing ``ex1()``, ``ex2()``, and -``ex3()`` visualized in the Ray timeline. Each red block is a call to one -of our user-defined remote functions, namely ``func()``, which sleeps for +For example, here are the results of executing ``ex1()``, ``ex2()``, and +``ex3()`` visualized in the Ray timeline. Each red block is a call to one +of our user-defined remote functions, namely ``func()``, which sleeps for 0.5 seconds: .. image:: user-profiling-timeline.gif -(highlighted color boxes for ``ex1()``, ``ex2()``, and ``ex3()`` added for +(highlighted color boxes for ``ex1()``, ``ex2()``, and ``ex3()`` added for the sake of this example) -Note how ``ex1()`` executes all five calls to ``func()`` in serial, +Note how ``ex1()`` executes all five calls to ``func()`` in serial, while ``ex2()`` and ``ex3()`` are able to parallelize their remote -function calls. +function calls. -Because we have 4 CPUs available on our machine, we can only able to -execute up to 4 remote functions in parallel. So, the fifth call to the -remote function in ``ex2()`` must wait until the first batch of ``func()`` +Because we have 4 CPUs available on our machine, we can only able to +execute up to 4 remote functions in parallel. So, the fifth call to the +remote function in ``ex2()`` must wait until the first batch of ``func()`` calls is finished. -In ``ex3()``, because of the serial dependency on ``other_func()``, we +In ``ex3()``, because of the serial dependency on ``other_func()``, we aren't even able to use all 4 of our cores to parallelize calls to ``func()``. 
The time gaps between the ``func()`` blocks are a result of staggering the -calls to ``func()`` in between waiting 0.3 seconds for ``other_func()``. +calls to ``func()`` in between waiting 0.3 seconds for ``other_func()``. -Also, notice that due to the aforementioned limitation of the Ray timeline, -``other_func()``, as a driver function and not a Ray task, is never +Also, notice that due to the aforementioned limitation of the Ray timeline, +``other_func()``, as a driver function and not a Ray task, is never visualized on the Ray timeline. **For more on Ray's Web UI,** such as how to access the UI on a remote -node over ssh, or for troubleshooting installation, please see our +node over ssh, or for troubleshooting installation, please see our `Web UI documentation section`_. .. _`Web UI documentation section`: http://ray.readthedocs.io/en/latest/webui.html diff --git a/doc/source/using-ray-and-docker-on-a-cluster.md b/doc/source/using-ray-and-docker-on-a-cluster.md index 9ae39d17851ef..4e7b7a52d9bd6 100644 --- a/doc/source/using-ray-and-docker-on-a-cluster.md +++ b/doc/source/using-ray-and-docker-on-a-cluster.md @@ -1,4 +1,4 @@ -# Using Ray and Docker on a Cluster (EXPERIMENTAL) +# Using Ray and Docker on a Cluster (Experimental) Packaging and deploying an application using Docker can provide certain advantages. It can make managing dependencies easier, help ensure that each cluster node receives a uniform configuration, and facilitate swapping hardware resources between applications. diff --git a/doc/source/using-ray-on-a-cluster.rst b/doc/source/using-ray-on-a-cluster.rst index 29c2585ac7cfe..611e47b79db23 100644 --- a/doc/source/using-ray-on-a-cluster.rst +++ b/doc/source/using-ray-on-a-cluster.rst @@ -51,7 +51,6 @@ Now we've started all of the Ray processes on each node Ray. This includes - An object store on each machine. - A local scheduler on each machine. - Multiple Redis servers (on the head node). -- One global scheduler (on the head node). To run some commands, start up Python on one of the nodes in the cluster, and do the following. diff --git a/doc/source/using-ray-on-a-large-cluster.rst b/doc/source/using-ray-on-a-large-cluster.rst index c3d6d8a8d2389..b87c8c05f5125 100644 --- a/doc/source/using-ray-on-a-large-cluster.rst +++ b/doc/source/using-ray-on-a-large-cluster.rst @@ -154,7 +154,6 @@ Now you have started all of the Ray processes on each node. These include: - An object store on each machine. - A local scheduler on each machine. - Multiple Redis servers (on the head node). -- One global scheduler (on the head node). 
To confirm that the Ray cluster setup is working, start up Python on one of the nodes in the cluster and enter the following commands to connect to the Ray diff --git a/docker/examples/Dockerfile b/docker/examples/Dockerfile index d4e6c34b22179..9cdee4ff117eb 100644 --- a/docker/examples/Dockerfile +++ b/docker/examples/Dockerfile @@ -5,6 +5,7 @@ FROM ray-project/deploy # This updates numpy to 1.14 and mutes errors from other libraries RUN conda install -y numpy RUN apt-get install -y zlib1g-dev -RUN pip install gym[atari] opencv-python==3.2.0.8 tensorflow lz4 keras +RUN pip install gym[atari] opencv-python==3.2.0.8 tensorflow lz4 keras pytest-timeout +RUN pip install -U h5py # Mutes FutureWarnings RUN pip install --upgrade git+git://github.com/hyperopt/hyperopt.git RUN conda install pytorch-cpu torchvision-cpu -c pytorch diff --git a/examples/carla/a3c_lane_keep.py b/examples/carla/a3c_lane_keep.py deleted file mode 100644 index 1338736d23f5e..0000000000000 --- a/examples/carla/a3c_lane_keep.py +++ /dev/null @@ -1,52 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import ray -from ray.tune import register_env, run_experiments - -from env import CarlaEnv, ENV_CONFIG -from models import register_carla_model -from scenarios import LANE_KEEP - -env_name = "carla_env" -env_config = ENV_CONFIG.copy() -env_config.update({ - "verbose": False, - "x_res": 80, - "y_res": 80, - "use_depth_camera": False, - "discrete_actions": False, - "server_map": "/Game/Maps/Town02", - "reward_function": "lane_keep", - "enable_planner": False, - "scenarios": [LANE_KEEP], -}) - -register_env(env_name, lambda env_config: CarlaEnv(env_config)) -register_carla_model() - -ray.init() -run_experiments({ - "carla-a3c": { - "run": "A3C", - "env": "carla_env", - "trial_resources": {"cpu": 4, "gpu": 1}, - "config": { - "env_config": env_config, - "model": { - "custom_model": "carla", - "custom_options": { - "image_shape": [80, 80, 6], - }, - "conv_filters": [ - [16, [8, 8], 4], - [32, [4, 4], 2], - [512, [10, 10], 1], - ], - }, - "gamma": 0.8, - "num_workers": 1, - }, - }, -}) diff --git a/examples/carla/dqn_lane_keep.py b/examples/carla/dqn_lane_keep.py deleted file mode 100644 index 2746a1c4bbd89..0000000000000 --- a/examples/carla/dqn_lane_keep.py +++ /dev/null @@ -1,57 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import ray -from ray.tune import register_env, run_experiments - -from env import CarlaEnv, ENV_CONFIG -from models import register_carla_model -from scenarios import LANE_KEEP - -env_name = "carla_env" -env_config = ENV_CONFIG.copy() -env_config.update({ - "verbose": False, - "x_res": 80, - "y_res": 80, - "use_depth_camera": False, - "discrete_actions": True, - "server_map": "/Game/Maps/Town02", - "reward_function": "lane_keep", - "enable_planner": False, - "scenarios": [LANE_KEEP], -}) - -register_env(env_name, lambda env_config: CarlaEnv(env_config)) -register_carla_model() - -ray.init() -run_experiments({ - "carla-dqn": { - "run": "DQN", - "env": "carla_env", - "trial_resources": {"cpu": 4, "gpu": 1}, - "config": { - "env_config": env_config, - "model": { - "custom_model": "carla", - "custom_options": { - "image_shape": [80, 80, 6], - }, - "conv_filters": [ - [16, [8, 8], 4], - [32, [4, 4], 2], - [512, [10, 10], 1], - ], - }, - "timesteps_per_iteration": 100, - "learning_starts": 1000, - "schedule_max_timesteps": 100000, - "gamma": 0.8, - "tf_session_args": { 
- "gpu_options": {"allow_growth": True}, - }, - }, - }, -}) diff --git a/examples/carla/ppo_lane_keep.py b/examples/carla/ppo_lane_keep.py deleted file mode 100644 index 25e5acbf328c4..0000000000000 --- a/examples/carla/ppo_lane_keep.py +++ /dev/null @@ -1,62 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import ray -from ray.tune import register_env, run_experiments - -from env import CarlaEnv, ENV_CONFIG -from models import register_carla_model -from scenarios import LANE_KEEP - -env_name = "carla_env" -env_config = ENV_CONFIG.copy() -env_config.update({ - "verbose": False, - "x_res": 80, - "y_res": 80, - "use_depth_camera": False, - "discrete_actions": False, - "server_map": "/Game/Maps/Town02", - "reward_function": "lane_keep", - "enable_planner": False, - "scenarios": [LANE_KEEP], -}) - -register_env(env_name, lambda env_config: CarlaEnv(env_config)) -register_carla_model() - -ray.init() -run_experiments({ - "carla-ppo": { - "run": "PPO", - "env": "carla_env", - "trial_resources": {"cpu": 4, "gpu": 1}, - "config": { - "env_config": env_config, - "model": { - "custom_model": "carla", - "custom_options": { - "image_shape": [80, 80, 6], - }, - "conv_filters": [ - [16, [8, 8], 4], - [32, [4, 4], 2], - [512, [10, 10], 1], - ], - }, - "num_workers": 1, - "timesteps_per_batch": 2000, - "min_steps_per_task": 100, - "lambda": 0.95, - "clip_param": 0.2, - "num_sgd_iter": 20, - "sgd_stepsize": 0.0001, - "sgd_batchsize": 32, - "devices": ["/gpu:0"], - "tf_session_args": { - "gpu_options": {"allow_growth": True} - } - }, - }, -}) diff --git a/examples/carla/scenarios.py b/examples/carla/scenarios.py deleted file mode 100644 index e6494af1830d0..0000000000000 --- a/examples/carla/scenarios.py +++ /dev/null @@ -1,119 +0,0 @@ -"""Collection of Carla scenarios, including those from the CoRL 2017 paper.""" - - -TEST_WEATHERS = [0, 2, 5, 7, 9, 10, 11, 12, 13] -TRAIN_WEATHERS = [1, 3, 4, 6, 8, 14] - - -def build_scenario( - city, start, end, vehicles, pedestrians, max_steps, weathers): - return { - "city": city, - "num_vehicles": vehicles, - "num_pedestrians": pedestrians, - "weather_distribution": weathers, - "start_pos_id": start, - "end_pos_id": end, - "max_steps": max_steps, - } - - -# Simple scenario for Town02 that involves driving down a road -DEFAULT_SCENARIO = build_scenario( - city="Town02", start=36, end=40, vehicles=20, pedestrians=40, - max_steps=200, weathers=[0]) - -# Simple scenario for Town02 that involves driving down a road -LANE_KEEP = build_scenario( - city="Town02", start=36, end=40, vehicles=0, pedestrians=0, - max_steps=2000, weathers=[0]) - -# Scenarios from the CoRL2017 paper -POSES_TOWN1_STRAIGHT = [ - [36, 40], [39, 35], [110, 114], [7, 3], [0, 4], - [68, 50], [61, 59], [47, 64], [147, 90], [33, 87], - [26, 19], [80, 76], [45, 49], [55, 44], [29, 107], - [95, 104], [84, 34], [53, 67], [22, 17], [91, 148], - [20, 107], [78, 70], [95, 102], [68, 44], [45, 69]] - - -POSES_TOWN1_ONE_CURVE = [ - [138, 17], [47, 16], [26, 9], [42, 49], [140, 124], - [85, 98], [65, 133], [137, 51], [76, 66], [46, 39], - [40, 60], [0, 29], [4, 129], [121, 140], [2, 129], - [78, 44], [68, 85], [41, 102], [95, 70], [68, 129], - [84, 69], [47, 79], [110, 15], [130, 17], [0, 17]] - -POSES_TOWN1_NAV = [ - [105, 29], [27, 130], [102, 87], [132, 27], [24, 44], - [96, 26], [34, 67], [28, 1], [140, 134], [105, 9], - [148, 129], [65, 18], [21, 16], [147, 97], [42, 51], - [30, 41], [18, 107], [69, 45], [102, 95], [18, 145], - [111, 64], 
[79, 45], [84, 69], [73, 31], [37, 81]] - - -POSES_TOWN2_STRAIGHT = [ - [38, 34], [4, 2], [12, 10], [62, 55], [43, 47], - [64, 66], [78, 76], [59, 57], [61, 18], [35, 39], - [12, 8], [0, 18], [75, 68], [54, 60], [45, 49], - [46, 42], [53, 46], [80, 29], [65, 63], [0, 81], - [54, 63], [51, 42], [16, 19], [17, 26], [77, 68]] - -POSES_TOWN2_ONE_CURVE = [ - [37, 76], [8, 24], [60, 69], [38, 10], [21, 1], - [58, 71], [74, 32], [44, 0], [71, 16], [14, 24], - [34, 11], [43, 14], [75, 16], [80, 21], [3, 23], - [75, 59], [50, 47], [11, 19], [77, 34], [79, 25], - [40, 63], [58, 76], [79, 55], [16, 61], [27, 11]] - -POSES_TOWN2_NAV = [ - [19, 66], [79, 14], [19, 57], [23, 1], - [53, 76], [42, 13], [31, 71], [33, 5], - [54, 30], [10, 61], [66, 3], [27, 12], - [79, 19], [2, 29], [16, 14], [5, 57], - [70, 73], [46, 67], [57, 50], [61, 49], [21, 12], - [51, 81], [77, 68], [56, 65], [43, 54]] - -TOWN1_STRAIGHT = [ - build_scenario("Town01", start, end, 0, 0, 300, TEST_WEATHERS) - for (start, end) in POSES_TOWN1_STRAIGHT] - -TOWN1_ONE_CURVE = [ - build_scenario("Town01", start, end, 0, 0, 600, TEST_WEATHERS) - for (start, end) in POSES_TOWN1_ONE_CURVE] - -TOWN1_NAVIGATION = [ - build_scenario("Town01", start, end, 0, 0, 900, TEST_WEATHERS) - for (start, end) in POSES_TOWN1_NAV] - -TOWN1_NAVIGATION_DYNAMIC = [ - build_scenario("Town01", start, end, 20, 50, 900, TEST_WEATHERS) - for (start, end) in POSES_TOWN1_NAV] - -TOWN2_STRAIGHT = [ - build_scenario("Town02", start, end, 0, 0, 300, TRAIN_WEATHERS) - for (start, end) in POSES_TOWN2_STRAIGHT] - -TOWN2_STRAIGHT_DYNAMIC = [ - build_scenario("Town02", start, end, 20, 50, 300, TRAIN_WEATHERS) - for (start, end) in POSES_TOWN2_STRAIGHT] - -TOWN2_ONE_CURVE = [ - build_scenario("Town02", start, end, 0, 0, 600, TRAIN_WEATHERS) - for (start, end) in POSES_TOWN2_ONE_CURVE] - -TOWN2_NAVIGATION = [ - build_scenario("Town02", start, end, 0, 0, 900, TRAIN_WEATHERS) - for (start, end) in POSES_TOWN2_NAV] - -TOWN2_NAVIGATION_DYNAMIC = [ - build_scenario("Town02", start, end, 20, 50, 900, TRAIN_WEATHERS) - for (start, end) in POSES_TOWN2_NAV] - -TOWN1_ALL = ( - TOWN1_STRAIGHT + TOWN1_ONE_CURVE + TOWN1_NAVIGATION + - TOWN1_NAVIGATION_DYNAMIC) - -TOWN2_ALL = ( - TOWN2_STRAIGHT + TOWN2_ONE_CURVE + TOWN2_NAVIGATION + - TOWN2_NAVIGATION_DYNAMIC) diff --git a/examples/custom_env/README b/examples/custom_env/README deleted file mode 100644 index 75ffcad88fb35..0000000000000 --- a/examples/custom_env/README +++ /dev/null @@ -1 +0,0 @@ -Example of using a custom gym env with RLlib. diff --git a/java/README.rst b/java/README.rst index 95ab961e769dc..e016169357874 100644 --- a/java/README.rst +++ b/java/README.rst @@ -7,6 +7,7 @@ Ray will read your configurations in the following order: * Java system properties: e.g., ``-Dray.home=/path/to/ray``. * A ``ray.conf`` file in the classpath: `example `_. +* Customise your own ``ray.conf`` path using system property ``-Dray.config=/path/to/ray.conf`` For all available config items and default values, see `this file `_. diff --git a/java/api/src/main/java/org/ray/api/Ray.java b/java/api/src/main/java/org/ray/api/Ray.java index 053f01d5534d3..7e252274ef735 100644 --- a/java/api/src/main/java/org/ray/api/Ray.java +++ b/java/api/src/main/java/org/ray/api/Ray.java @@ -41,7 +41,10 @@ public static synchronized void init(RayRuntimeFactory factory) { * Shutdown Ray runtime. 
*/ public static void shutdown() { - runtime.shutdown(); + if (runtime != null) { + runtime.shutdown(); + runtime = null; + } } /** diff --git a/java/api/src/main/java/org/ray/api/RayCall.java b/java/api/src/main/java/org/ray/api/RayCall.java index ef40a238c0e29..967830199402c 100644 --- a/java/api/src/main/java/org/ray/api/RayCall.java +++ b/java/api/src/main/java/org/ray/api/RayCall.java @@ -2,6 +2,7 @@ package org.ray.api; +import org.ray.api.function.RayFunc; import org.ray.api.function.RayFunc0; import org.ray.api.function.RayFunc1; import org.ray.api.function.RayFunc2; @@ -9,6 +10,9 @@ import org.ray.api.function.RayFunc4; import org.ray.api.function.RayFunc5; import org.ray.api.function.RayFunc6; +import org.ray.api.options.ActorCreationOptions; +import org.ray.api.options.BaseTaskOptions; +import org.ray.api.options.CallOptions; /** * This class provides type-safe interfaces for `Ray.call` and `Ray.createActor`. @@ -20,511 +24,1019 @@ class RayCall { // ======================================= public static RayObject call(RayFunc0 f) { Object[] args = new Object[]{}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); + } + public static RayObject call(RayFunc0 f, CallOptions options) { + Object[] args = new Object[]{}; + return Ray.internal().call(f, args, options); } public static RayObject call(RayFunc1 f, T0 t0) { Object[] args = new Object[]{t0}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc1 f, RayObject t0) { Object[] args = new Object[]{t0}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); + } + public static RayObject call(RayFunc1 f, T0 t0, CallOptions options) { + Object[] args = new Object[]{t0}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc1 f, RayObject t0, CallOptions options) { + Object[] args = new Object[]{t0}; + return Ray.internal().call(f, args, options); } public static RayObject call(RayFunc2 f, T0 t0, T1 t1) { Object[] args = new Object[]{t0, t1}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc2 f, T0 t0, RayObject t1) { Object[] args = new Object[]{t0, t1}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc2 f, RayObject t0, T1 t1) { Object[] args = new Object[]{t0, t1}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc2 f, RayObject t0, RayObject t1) { Object[] args = new Object[]{t0, t1}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); + } + public static RayObject call(RayFunc2 f, T0 t0, T1 t1, CallOptions options) { + Object[] args = new Object[]{t0, t1}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc2 f, T0 t0, RayObject t1, CallOptions options) { + Object[] args = new Object[]{t0, t1}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc2 f, RayObject t0, T1 t1, CallOptions options) { + Object[] args = new Object[]{t0, t1}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc2 f, RayObject t0, RayObject t1, CallOptions options) { + Object[] args = new Object[]{t0, t1}; + return Ray.internal().call(f, args, options); } public static RayObject call(RayFunc3 f, T0 t0, T1 t1, T2 t2) { Object[] args = 
new Object[]{t0, t1, t2}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc3 f, T0 t0, T1 t1, RayObject t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc3 f, T0 t0, RayObject t1, T2 t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc3 f, T0 t0, RayObject t1, RayObject t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc3 f, RayObject t0, T1 t1, T2 t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc3 f, RayObject t0, T1 t1, RayObject t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc3 f, RayObject t0, RayObject t1, T2 t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc3 f, RayObject t0, RayObject t1, RayObject t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); + } + public static RayObject call(RayFunc3 f, T0 t0, T1 t1, T2 t2, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc3 f, T0 t0, T1 t1, RayObject t2, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc3 f, T0 t0, RayObject t1, T2 t2, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc3 f, T0 t0, RayObject t1, RayObject t2, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc3 f, RayObject t0, T1 t1, T2 t2, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc3 f, RayObject t0, T1 t1, RayObject t2, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc3 f, RayObject t0, RayObject t1, T2 t2, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc3 f, RayObject t0, RayObject t1, RayObject t2, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().call(f, args, options); } public static RayObject call(RayFunc4 f, T0 t0, T1 t1, T2 t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, T0 t0, T1 t1, T2 t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, T0 t0, T1 
t1, RayObject t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, T0 t0, T1 t1, RayObject t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, T0 t0, RayObject t1, T2 t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, T0 t0, RayObject t1, T2 t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, T0 t0, RayObject t1, RayObject t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, T0 t0, RayObject t1, RayObject t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, RayObject t0, T1 t1, T2 t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, RayObject t0, T1 t1, T2 t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, RayObject t0, T1 t1, RayObject t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, RayObject t0, T1 t1, RayObject t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, RayObject t0, RayObject t1, T2 t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, RayObject t0, RayObject t1, T2 t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, RayObject t0, RayObject t1, RayObject t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc4 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); + } + public static RayObject call(RayFunc4 f, T0 t0, T1 t1, T2 t2, T3 t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, T0 t0, T1 t1, T2 t2, RayObject t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, T0 t0, T1 t1, RayObject t2, T3 t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; 
+ return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, T0 t0, T1 t1, RayObject t2, RayObject t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, T0 t0, RayObject t1, T2 t2, T3 t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, T0 t0, RayObject t1, T2 t2, RayObject t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, T0 t0, RayObject t1, RayObject t2, T3 t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, RayObject t0, T1 t1, T2 t2, T3 t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, RayObject t0, T1 t1, T2 t2, RayObject t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, RayObject t0, T1 t1, RayObject t2, T3 t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, RayObject t0, RayObject t1, T2 t2, T3 t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc4 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().call(f, args, options); } public static RayObject call(RayFunc5 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4) { Object[] args = new 
Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); 
} public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); + } + public static RayObject call(RayFunc5 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, 
T1 t1, T2 t2, RayObject t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, T2 t2, RayObject t3, 
T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().call(f, args, options); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } 
public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + 
return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, 
RayObject t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return 
Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + 
return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); } public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().call(f, args); + return Ray.internal().call(f, args, null); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return 
Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, 
options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, 
options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new 
Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, T5 t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); + } + public static RayObject call(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5, CallOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().call(f, args, options); } // =========================================== // Methods for remote actor method invocation. 
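Note (not part of the patch): the hunk above only adds mechanically generated overloads. For every existing Ray.call signature (zero to six arguments, each position either a plain value or a RayObject), a twin is added whose last parameter is a CallOptions object forwarded to Ray.internal().call(f, args, options). A minimal usage sketch follows; the import paths, the CallOptions constructor taking a resource map, and the annotation remark are assumptions for illustration — only the Ray.call(f, arg, options) shape comes from the generated code above.

    import java.util.HashMap;
    import java.util.Map;
    // Package names below are assumed for illustration.
    import org.ray.api.Ray;
    import org.ray.api.RayObject;
    import org.ray.api.options.CallOptions;

    public class CallOptionsExample {
      // Remote function; depending on the Ray version this may require a
      // @RayRemote-style annotation, omitted here.
      public static int square(int x) {
        return x * x;
      }

      public static void main(String[] args) {
        Ray.init();
        // Hypothetical construction: a custom resource demand for this task.
        Map<String, Double> resources = new HashMap<>();
        resources.put("CPU", 1.0);
        CallOptions options = new CallOptions(resources); // assumed constructor
        // One of the overloads added in this hunk: RayFunc1 plus CallOptions.
        RayObject<Integer> result = Ray.call(CallOptionsExample::square, 4, options);
        System.out.println(result.get()); // prints 16
      }
    }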
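The createActor hunk that begins below follows the same pattern: every existing createActor overload now forwards a null options argument, and a parallel overload accepting ActorCreationOptions is added for each argument combination. Again a sketch, not part of the patch; the ActorCreationOptions constructor and the exact actor-method call form are assumptions with hypothetical names, based only on the surrounding generated signatures.

    import java.util.HashMap;
    import java.util.Map;
    // Assumed import paths, as above.
    import org.ray.api.Ray;
    import org.ray.api.RayActor;
    import org.ray.api.RayObject;
    import org.ray.api.options.ActorCreationOptions;

    public class Counter {
      private int value = 0;

      public int increment() {
        return ++value;
      }

      // Static factory used as the RayFunc0 actor-creation function.
      public static Counter create() {
        return new Counter();
      }

      public static void main(String[] args) {
        Ray.init();
        // Hypothetical: options carrying a resource demand for the actor.
        Map<String, Double> resources = new HashMap<>();
        resources.put("CPU", 1.0);
        ActorCreationOptions options = new ActorCreationOptions(resources); // assumed constructor
        RayActor<Counter> counter = Ray.createActor(Counter::create, options);
        // Remote actor method invocation (the overloads referenced by the
        // comment above); the exact call form may differ by version.
        RayObject<Integer> one = Ray.call(Counter::increment, counter);
        System.out.println(one.get()); // prints 1
      }
    }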
@@ -786,510 +1298,1018 @@ public static RayObject call(RayFunc6 RayActor createActor(RayFunc0 f) { Object[] args = new Object[]{}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); + } + public static RayActor createActor(RayFunc0 f, ActorCreationOptions options) { + Object[] args = new Object[]{}; + return Ray.internal().createActor(f, args, options); } public static RayActor createActor(RayFunc1 f, T0 t0) { Object[] args = new Object[]{t0}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc1 f, RayObject t0) { Object[] args = new Object[]{t0}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); + } + public static RayActor createActor(RayFunc1 f, T0 t0, ActorCreationOptions options) { + Object[] args = new Object[]{t0}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc1 f, RayObject t0, ActorCreationOptions options) { + Object[] args = new Object[]{t0}; + return Ray.internal().createActor(f, args, options); } public static RayActor createActor(RayFunc2 f, T0 t0, T1 t1) { Object[] args = new Object[]{t0, t1}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc2 f, T0 t0, RayObject t1) { Object[] args = new Object[]{t0, t1}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc2 f, RayObject t0, T1 t1) { Object[] args = new Object[]{t0, t1}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc2 f, RayObject t0, RayObject t1) { Object[] args = new Object[]{t0, t1}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); + } + public static RayActor createActor(RayFunc2 f, T0 t0, T1 t1, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc2 f, T0 t0, RayObject t1, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc2 f, RayObject t0, T1 t1, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc2 f, RayObject t0, RayObject t1, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1}; + return Ray.internal().createActor(f, args, options); } public static RayActor createActor(RayFunc3 f, T0 t0, T1 t1, T2 t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc3 f, T0 t0, T1 t1, RayObject t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc3 f, T0 t0, RayObject t1, T2 t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc3 f, T0 t0, RayObject t1, RayObject t2) { Object[] args = new 
Object[]{t0, t1, t2}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc3 f, RayObject t0, T1 t1, T2 t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc3 f, RayObject t0, T1 t1, RayObject t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc3 f, RayObject t0, RayObject t1, T2 t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc3 f, RayObject t0, RayObject t1, RayObject t2) { Object[] args = new Object[]{t0, t1, t2}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); + } + public static RayActor createActor(RayFunc3 f, T0 t0, T1 t1, T2 t2, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc3 f, T0 t0, T1 t1, RayObject t2, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc3 f, T0 t0, RayObject t1, T2 t2, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc3 f, T0 t0, RayObject t1, RayObject t2, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc3 f, RayObject t0, T1 t1, T2 t2, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc3 f, RayObject t0, T1 t1, RayObject t2, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc3 f, RayObject t0, RayObject t1, T2 t2, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc3 f, RayObject t0, RayObject t1, RayObject t2, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2}; + return Ray.internal().createActor(f, args, options); } public static RayActor createActor(RayFunc4 f, T0 t0, T1 t1, T2 t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, T0 t0, T1 t1, T2 t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, T0 t0, T1 t1, RayObject t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, T0 t0, T1 t1, RayObject t2, RayObject t3) { Object[] args = new 
Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, T0 t0, RayObject t1, T2 t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, T0 t0, RayObject t1, T2 t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, T0 t0, RayObject t1, RayObject t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, T0 t0, RayObject t1, RayObject t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, RayObject t0, T1 t1, T2 t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, RayObject t0, T1 t1, T2 t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, RayObject t0, T1 t1, RayObject t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, RayObject t0, T1 t1, RayObject t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, RayObject t0, RayObject t1, T2 t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, RayObject t0, RayObject t1, T2 t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, RayObject t0, RayObject t1, RayObject t2, T3 t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc4 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3) { Object[] args = new Object[]{t0, t1, t2, t3}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); + } + public static RayActor createActor(RayFunc4 f, T0 t0, T1 t1, T2 t2, T3 t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, T0 t0, T1 t1, T2 t2, RayObject t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, T0 t0, T1 t1, RayObject t2, T3 t3, ActorCreationOptions options) { 
+ Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, T0 t0, T1 t1, RayObject t2, RayObject t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, T0 t0, RayObject t1, T2 t2, T3 t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, T0 t0, RayObject t1, T2 t2, RayObject t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, T0 t0, RayObject t1, RayObject t2, T3 t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, RayObject t0, T1 t1, T2 t2, T3 t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, RayObject t0, T1 t1, T2 t2, RayObject t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, RayObject t0, T1 t1, RayObject t2, T3 t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, RayObject t0, RayObject t1, T2 t2, T3 t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc4 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3}; + return Ray.internal().createActor(f, args, options); } public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return 
Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static 
RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static 
RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4) { Object[] args = new Object[]{t0, t1, t2, t3, t4}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); + } + public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, 
t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor 
createActor(RayFunc5 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc5 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4}; + return Ray.internal().createActor(f, args, options); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public 
static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, 
t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return 
Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor 
createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor 
createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, T5 t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); } public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5) { Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; - return Ray.internal().createActor(f, args); + return Ray.internal().createActor(f, args, null); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, T3 t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, T2 t2, RayObject t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, T3 t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public 
static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, T3 t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return 
Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, T0 t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, T3 t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, T2 t2, RayObject t3, RayObject t4, RayObject t5, 
ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, T3 t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, T1 t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, T3 t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public 
static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, T2 t2, RayObject t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, T3 t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, T4 t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, T5 t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); + } + public static RayActor createActor(RayFunc6 f, RayObject t0, RayObject t1, RayObject t2, RayObject t3, RayObject t4, RayObject t5, ActorCreationOptions options) { + Object[] args = new Object[]{t0, t1, t2, t3, t4, t5}; + return Ray.internal().createActor(f, args, options); } } diff --git a/java/api/src/main/java/org/ray/api/annotation/RayRemote.java b/java/api/src/main/java/org/ray/api/annotation/RayRemote.java index a47e0768f0fbf..197ee663f58a0 100644 --- a/java/api/src/main/java/org/ray/api/annotation/RayRemote.java +++ b/java/api/src/main/java/org/ray/api/annotation/RayRemote.java @@ -15,10 +15,4 @@ @Target({ElementType.METHOD, ElementType.TYPE}) public @interface RayRemote { - /** - * Defines the quantity of various custom resources to reserve - * for this task or for the lifetime of the actor. - * @return an array of custom resource items. 
- */ - ResourceItem[] resources() default {}; } diff --git a/java/api/src/main/java/org/ray/api/annotation/ResourceItem.java b/java/api/src/main/java/org/ray/api/annotation/ResourceItem.java deleted file mode 100644 index f4895eba6164c..0000000000000 --- a/java/api/src/main/java/org/ray/api/annotation/ResourceItem.java +++ /dev/null @@ -1,28 +0,0 @@ -package org.ray.api.annotation; - - -import java.lang.annotation.Documented; -import java.lang.annotation.ElementType; -import java.lang.annotation.Retention; -import java.lang.annotation.RetentionPolicy; -import java.lang.annotation.Target; - -/** - * Represents a custom resource, including its name and quantity. - */ -@Documented -@Retention(RetentionPolicy.RUNTIME) -@Target(ElementType.ANNOTATION_TYPE) -public @interface ResourceItem { - - /** - * Name of this resource, must not be null or empty. - */ - String name(); - - /** - * Quantity of this resource. - */ - double value() default 0; - -} diff --git a/java/api/src/main/java/org/ray/api/id/UniqueId.java b/java/api/src/main/java/org/ray/api/id/UniqueId.java index 0d32d0f8f3c4b..f93bdc737229e 100644 --- a/java/api/src/main/java/org/ray/api/id/UniqueId.java +++ b/java/api/src/main/java/org/ray/api/id/UniqueId.java @@ -112,6 +112,6 @@ public boolean equals(Object obj) { @Override public String toString() { - return DatatypeConverter.printHexBinary(id); + return DatatypeConverter.printHexBinary(id).toLowerCase(); } } diff --git a/java/api/src/main/java/org/ray/api/options/ActorCreationOptions.java b/java/api/src/main/java/org/ray/api/options/ActorCreationOptions.java new file mode 100644 index 0000000000000..20db30944e513 --- /dev/null +++ b/java/api/src/main/java/org/ray/api/options/ActorCreationOptions.java @@ -0,0 +1,18 @@ +package org.ray.api.options; + +import java.util.Map; + +/** + * The options for creating actor. + */ +public class ActorCreationOptions extends BaseTaskOptions { + + public ActorCreationOptions() { + super(); + } + + public ActorCreationOptions(Map resources) { + super(resources); + } + +} diff --git a/java/api/src/main/java/org/ray/api/options/BaseTaskOptions.java b/java/api/src/main/java/org/ray/api/options/BaseTaskOptions.java new file mode 100644 index 0000000000000..65494d532a687 --- /dev/null +++ b/java/api/src/main/java/org/ray/api/options/BaseTaskOptions.java @@ -0,0 +1,20 @@ +package org.ray.api.options; + +import java.util.HashMap; +import java.util.Map; + +/** + * The options class for RayCall or ActorCreation. + */ +public abstract class BaseTaskOptions { + public Map resources; + + public BaseTaskOptions() { + resources = new HashMap<>(); + } + + public BaseTaskOptions(Map resources) { + this.resources = resources; + } + +} diff --git a/java/api/src/main/java/org/ray/api/options/CallOptions.java b/java/api/src/main/java/org/ray/api/options/CallOptions.java new file mode 100644 index 0000000000000..84adfc122e04a --- /dev/null +++ b/java/api/src/main/java/org/ray/api/options/CallOptions.java @@ -0,0 +1,18 @@ +package org.ray.api.options; + +import java.util.Map; + +/** + * The options for RayCall. 
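Note: with the ResourceItem annotation removed above, per-task and per-actor resource requirements are now supplied at invocation time through the new options classes. A minimal caller-side sketch, assuming the generated Ray.call/Ray.createActor overloads introduced in this patch; the Counter class and doubleIt function are hypothetical and exist only for illustration:

    import java.util.HashMap;
    import java.util.Map;
    import org.ray.api.Ray;
    import org.ray.api.RayActor;
    import org.ray.api.RayObject;
    import org.ray.api.annotation.RayRemote;
    import org.ray.api.options.ActorCreationOptions;
    import org.ray.api.options.CallOptions;

    public class OptionsUsageSketch {

      // Hypothetical actor class, used only to illustrate the new API.
      @RayRemote
      public static class Counter {
        private int value = 0;

        public int increment() {
          return ++value;
        }
      }

      @RayRemote
      public static int doubleIt(int x) {
        return x * 2;
      }

      public static void main(String[] args) {
        Ray.init();

        // Reserve 2 CPUs for the lifetime of the actor. This replaces the removed
        // @RayRemote(resources = {@ResourceItem(...)}) declaration.
        Map<String, Double> actorResources = new HashMap<>();
        actorResources.put("CPU", 2.0);
        RayActor<Counter> counter =
            Ray.createActor(Counter::new, new ActorCreationOptions(actorResources));

        // Actor method calls are unchanged; only plain remote calls and actor
        // creation gained options overloads in this patch.
        RayObject<Integer> incremented = Ray.call(Counter::increment, counter);

        // Reserve 1 GPU for a single remote call via CallOptions.
        Map<String, Double> callResources = new HashMap<>();
        callResources.put("GPU", 1.0);
        RayObject<Integer> doubled =
            Ray.call(OptionsUsageSketch::doubleIt, 1, new CallOptions(callResources));
      }
    }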
+ */ +public class CallOptions extends BaseTaskOptions { + + public CallOptions() { + super(); + } + + public CallOptions(Map resources) { + super(resources); + } + +} diff --git a/java/api/src/main/java/org/ray/api/runtime/RayRuntime.java b/java/api/src/main/java/org/ray/api/runtime/RayRuntime.java index d609d4de593d1..7c12c3543c04a 100644 --- a/java/api/src/main/java/org/ray/api/runtime/RayRuntime.java +++ b/java/api/src/main/java/org/ray/api/runtime/RayRuntime.java @@ -6,6 +6,9 @@ import org.ray.api.WaitResult; import org.ray.api.function.RayFunc; import org.ray.api.id.UniqueId; +import org.ray.api.options.ActorCreationOptions; +import org.ray.api.options.BaseTaskOptions; +import org.ray.api.options.CallOptions; /** * Base interface of a Ray runtime. @@ -65,9 +68,10 @@ public interface RayRuntime { * * @param func The remote function to run. * @param args The arguments of the remote function. + * @param options The options for this call. * @return The result object. */ - RayObject call(RayFunc func, Object[] args); + RayObject call(RayFunc func, Object[] args, CallOptions options); /** * Invoke a remote function on an actor. @@ -85,7 +89,9 @@ public interface RayRuntime { * @param actorFactoryFunc A remote function whose return value is the actor object. * @param args The arguments for the remote function. * @param The type of the actor object. + * @param options The options for creating actor. * @return A handle to the actor. */ - RayActor createActor(RayFunc actorFactoryFunc, Object[] args); + RayActor createActor(RayFunc actorFactoryFunc, Object[] args, + ActorCreationOptions options); } diff --git a/java/checkstyle-suppressions.xml b/java/checkstyle-suppressions.xml index 619c24e1466f0..0422332258dfa 100644 --- a/java/checkstyle-suppressions.xml +++ b/java/checkstyle-suppressions.xml @@ -10,5 +10,5 @@ - + diff --git a/java/doc/installation.rst b/java/doc/installation.rst index fca3b12e7c971..8daec29ace403 100644 --- a/java/doc/installation.rst +++ b/java/doc/installation.rst @@ -26,7 +26,7 @@ For Ubuntu users, run the following commands: # If you are on Ubuntu 14.04, you need the following. 
pip install cmake - pip install cython + pip install cython==0.27.3 For macOS users, run the following commands: :: @@ -34,7 +34,7 @@ For macOS users, run the following commands: brew update brew install maven cmake pkg-config automake autoconf libtool openssl bison wget - pip install cython + pip install cython==0.27.3 Build Ray ^^^^^^^^^ diff --git a/java/prepare.sh b/java/prepare.sh index 807301a74edba..9554e500a8edd 100755 --- a/java/prepare.sh +++ b/java/prepare.sh @@ -42,15 +42,15 @@ fi # echo "ray_dir = $ray_dir" declare -a nativeBinaries=( - "./src/common/thirdparty/redis/src/redis-server" + "./src/ray/thirdparty/redis/src/redis-server" "./src/plasma/plasma_store_server" "./src/ray/raylet/raylet" "./src/ray/raylet/raylet_monitor" ) declare -a nativeLibraries=( - "./src/common/redis_module/libray_redis_module.so" - "./src/local_scheduler/liblocal_scheduler_library_java.*" + "./src/ray/gcs/redis_module/libray_redis_module.so" + "./src/ray/raylet/liblocal_scheduler_library_java.*" "./src/plasma/libplasma_java.*" "./src/ray/raylet/*lib.a" ) diff --git a/java/runtime/src/main/java/org/ray/runtime/AbstractRayRuntime.java b/java/runtime/src/main/java/org/ray/runtime/AbstractRayRuntime.java index b035f3b52bc0c..10dc172fd4d99 100644 --- a/java/runtime/src/main/java/org/ray/runtime/AbstractRayRuntime.java +++ b/java/runtime/src/main/java/org/ray/runtime/AbstractRayRuntime.java @@ -10,8 +10,12 @@ import org.ray.api.RayActor; import org.ray.api.RayObject; import org.ray.api.WaitResult; +import org.ray.api.exception.RayException; import org.ray.api.function.RayFunc; import org.ray.api.id.UniqueId; +import org.ray.api.options.ActorCreationOptions; +import org.ray.api.options.BaseTaskOptions; +import org.ray.api.options.CallOptions; import org.ray.api.runtime.RayRuntime; import org.ray.runtime.config.RayConfig; import org.ray.runtime.functionmanager.FunctionManager; @@ -22,8 +26,7 @@ import org.ray.runtime.task.ArgumentsBuilder; import org.ray.runtime.task.TaskSpec; import org.ray.runtime.util.ResourceUtil; -import org.ray.runtime.util.UniqueIdHelper; -import org.ray.runtime.util.exception.TaskExecutionException; +import org.ray.runtime.util.UniqueIdUtil; import org.ray.runtime.util.logger.RayLog; /** @@ -48,7 +51,7 @@ public abstract class AbstractRayRuntime implements RayRuntime { public AbstractRayRuntime(RayConfig rayConfig) { this.rayConfig = rayConfig; - functionManager = new FunctionManager(); + functionManager = new FunctionManager(rayConfig.driverResourcePath); worker = new Worker(this); workerContext = new WorkerContext(rayConfig.workerMode, rayConfig.driverId); } @@ -63,7 +66,7 @@ public AbstractRayRuntime(RayConfig rayConfig) { @Override public RayObject put(T obj) { - UniqueId objectId = UniqueIdHelper.computePutId( + UniqueId objectId = UniqueIdUtil.computePutId( workerContext.getCurrentTask().taskId, workerContext.nextPutIndex()); put(objectId, obj); @@ -72,12 +75,12 @@ public RayObject put(T obj) { public void put(UniqueId objectId, T obj) { UniqueId taskId = workerContext.getCurrentTask().taskId; - RayLog.core.info("Putting object {}, for task {} ", objectId, taskId); + RayLog.core.debug("Putting object {}, for task {} ", objectId, taskId); objectStoreProxy.put(objectId, obj, null); } @Override - public T get(UniqueId objectId) throws TaskExecutionException { + public T get(UniqueId objectId) throws RayException { List ret = get(ImmutableList.of(objectId)); return ret.get(0); } @@ -85,6 +88,8 @@ public T get(UniqueId objectId) throws TaskExecutionException { @Override public List 
get(List objectIds) { boolean wasBlocked = false; + // TODO(swang): If we are not on the main thread, then we should generate a + // random task ID to pass to the backend. UniqueId taskId = workerContext.getCurrentTask().taskId; try { @@ -94,7 +99,7 @@ public List get(List objectIds) { List> fetchBatches = splitIntoBatches(objectIds, FETCH_BATCH_SIZE); for (List batch : fetchBatches) { - rayletClient.reconstructObjects(batch, true); + rayletClient.fetchOrReconstruct(batch, true, taskId); } // Get the objects. We initially try to get the objects immediately. @@ -119,7 +124,7 @@ public List get(List objectIds) { splitIntoBatches(unreadyList, FETCH_BATCH_SIZE); for (List batch : reconstructBatches) { - rayletClient.reconstructObjects(batch, false); + rayletClient.fetchOrReconstruct(batch, false, taskId); } List> results = objectStoreProxy @@ -146,7 +151,7 @@ public List get(List objectIds) { } return finalRet; - } catch (TaskExecutionException e) { + } catch (RayException e) { RayLog.core.error("Task " + taskId + " Objects " + Arrays.toString(objectIds.toArray()) + " get with Exception", e); throw e; @@ -154,7 +159,7 @@ public List get(List objectIds) { // If there were objects that we weren't able to get locally, let the local // scheduler know that we're now unblocked. if (wasBlocked) { - rayletClient.notifyUnblocked(); + rayletClient.notifyUnblocked(taskId); } } } @@ -182,12 +187,15 @@ private List> splitIntoBatches(List objectIds, int batc @Override public WaitResult wait(List> waitList, int numReturns, int timeoutMs) { - return rayletClient.wait(waitList, numReturns, timeoutMs); + // TODO(swang): If we are not on the main thread, then we should generate a + // random task ID to pass to the backend. + return rayletClient.wait(waitList, numReturns, timeoutMs, + workerContext.getCurrentTask().taskId); } @Override - public RayObject call(RayFunc func, Object[] args) { - TaskSpec spec = createTaskSpec(func, RayActorImpl.NIL, args, false); + public RayObject call(RayFunc func, Object[] args, CallOptions options) { + TaskSpec spec = createTaskSpec(func, RayActorImpl.NIL, args, false, options); rayletClient.submitTask(spec); return new RayObjectImpl(spec.returnIds[0]); } @@ -198,7 +206,7 @@ public RayObject call(RayFunc func, RayActor actor, Object[] args) { throw new IllegalArgumentException("Unsupported actor type: " + actor.getClass().getName()); } RayActorImpl actorImpl = (RayActorImpl)actor; - TaskSpec spec = createTaskSpec(func, actorImpl, args, false); + TaskSpec spec = createTaskSpec(func, actorImpl, args, false, null); spec.getExecutionDependencies().add(((RayActorImpl) actor).getTaskCursor()); actorImpl.setTaskCursor(spec.returnIds[1]); rayletClient.submitTask(spec); @@ -207,8 +215,10 @@ public RayObject call(RayFunc func, RayActor actor, Object[] args) { @Override @SuppressWarnings("unchecked") - public RayActor createActor(RayFunc actorFactoryFunc, Object[] args) { - TaskSpec spec = createTaskSpec(actorFactoryFunc, RayActorImpl.NIL, args, true); + public RayActor createActor(RayFunc actorFactoryFunc, + Object[] args, ActorCreationOptions options) { + TaskSpec spec = createTaskSpec(actorFactoryFunc, RayActorImpl.NIL, + args, true, options); RayActorImpl actor = new RayActorImpl(spec.returnIds[0]); actor.increaseTaskCounter(); actor.setTaskCursor(spec.returnIds[0]); @@ -222,7 +232,7 @@ public RayActor createActor(RayFunc actorFactoryFunc, Object[] args) { private UniqueId[] genReturnIds(UniqueId taskId, int numReturns) { UniqueId[] ret = new UniqueId[numReturns]; for (int i = 0; i < 
numReturns; i++) { - ret[i] = UniqueIdHelper.computeReturnId(taskId, i + 1); + ret[i] = UniqueIdUtil.computeReturnId(taskId, i + 1); } return ret; } @@ -236,11 +246,10 @@ private UniqueId[] genReturnIds(UniqueId taskId, int numReturns) { * @return A TaskSpec object. */ private TaskSpec createTaskSpec(RayFunc func, RayActorImpl actor, Object[] args, - boolean isActorCreationTask) { + boolean isActorCreationTask, BaseTaskOptions taskOptions) { final TaskSpec current = workerContext.getCurrentTask(); UniqueId taskId = rayletClient.generateTaskId(current.driverId, - current.taskId, - workerContext.nextCallIndex()); + current.taskId, workerContext.nextCallIndex()); int numReturns = actor.getId().isNil() ? 1 : 2; UniqueId[] returnIds = genReturnIds(taskId, numReturns); @@ -249,6 +258,18 @@ private TaskSpec createTaskSpec(RayFunc func, RayActorImpl actor, Object[] args, actorCreationId = returnIds[0]; } + Map resources; + if (null == taskOptions) { + resources = new HashMap<>(); + } else { + resources = new HashMap<>(taskOptions.resources); + } + + if (!resources.containsKey(ResourceUtil.CPU_LITERAL) + && !resources.containsKey(ResourceUtil.CPU_LITERAL.toLowerCase())) { + resources.put(ResourceUtil.CPU_LITERAL, 0.0); + } + RayFunction rayFunction = functionManager.getFunction(current.driverId, func); return new TaskSpec( current.driverId, @@ -261,7 +282,7 @@ private TaskSpec createTaskSpec(RayFunc func, RayActorImpl actor, Object[] args, actor.increaseTaskCounter(), ArgumentsBuilder.wrap(args), returnIds, - ResourceUtil.getResourcesMapFromArray(rayFunction.getRayRemoteAnnotation()), + resources, rayFunction.getFunctionDescriptor() ); } @@ -286,4 +307,3 @@ public FunctionManager getFunctionManager() { return functionManager; } } - diff --git a/java/runtime/src/main/java/org/ray/runtime/config/RayConfig.java b/java/runtime/src/main/java/org/ray/runtime/config/RayConfig.java index a2ef237e28068..d4d90f24ece27 100644 --- a/java/runtime/src/main/java/org/ray/runtime/config/RayConfig.java +++ b/java/runtime/src/main/java/org/ray/runtime/config/RayConfig.java @@ -6,11 +6,14 @@ import com.typesafe.config.Config; import com.typesafe.config.ConfigException; import com.typesafe.config.ConfigFactory; + +import java.io.File; import java.util.List; import java.util.Map; import org.ray.api.id.UniqueId; import org.ray.runtime.util.NetworkUtil; import org.ray.runtime.util.ResourceUtil; +import org.ray.runtime.util.StringUtil; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -35,6 +38,7 @@ public class RayConfig { public final boolean redirectOutput; public final List libraryPath; public final List classpath; + public final List jvmParameters; private String redisAddress; private String redisIp; @@ -51,6 +55,8 @@ public class RayConfig { public final String redisModulePath; public final String plasmaStoreExecutablePath; public final String rayletExecutablePath; + public final String driverResourcePath; + public final String pythonWorkerCommand; private void validate() { if (workerMode == WorkerMode.WORKER) { @@ -126,6 +132,18 @@ public RayConfig(Config config) { List customLibraryPath = config.getStringList("ray.library.path"); // custom classpath classpath = config.getStringList("ray.classpath"); + // custom worker jvm parameters + if (config.hasPath("ray.worker.jvm-parameters")) { + jvmParameters = config.getStringList("ray.worker.jvm-parameters"); + } else { + jvmParameters = ImmutableList.of(); + } + + if (config.hasPath("ray.worker.python-command")) { + pythonWorkerCommand = 
config.getString("ray.worker.python-command"); + } else { + pythonWorkerCommand = null; + } // redis configurations String redisAddress = config.getString("ray.redis.address"); @@ -147,15 +165,22 @@ public RayConfig(Config config) { // library path this.libraryPath = new ImmutableList.Builder().add( rayHome + "/build/src/plasma", - rayHome + "/build/src/local_scheduler" + rayHome + "/build/src/ray/raylet" ).addAll(customLibraryPath).build(); redisServerExecutablePath = rayHome + - "/build/src/common/thirdparty/redis/src/redis-server"; - redisModulePath = rayHome + "/build/src/common/redis_module/libray_redis_module.so"; + "/build/src/ray/thirdparty/redis/src/redis-server"; + redisModulePath = rayHome + "/build/src/ray/gcs/redis_module/libray_redis_module.so"; plasmaStoreExecutablePath = rayHome + "/build/src/plasma/plasma_store_server"; rayletExecutablePath = rayHome + "/build/src/ray/raylet/raylet"; + // driver resource path + if (config.hasPath("ray.driver.resource-path")) { + driverResourcePath = config.getString("ray.driver.resource-path"); + } else { + driverResourcePath = null; + } + // validate config validate(); LOGGER.debug("Created config: {}", this); @@ -219,9 +244,16 @@ public String toString() { */ public static RayConfig create() { ConfigFactory.invalidateCaches(); - Config config = ConfigFactory.systemProperties() - .withFallback(ConfigFactory.load(CUSTOM_CONFIG_FILE)) - .withFallback(ConfigFactory.load(DEFAULT_CONFIG_FILE)); + Config config = ConfigFactory.systemProperties(); + String configPath = System.getProperty("ray.config"); + if (StringUtil.isNullOrEmpty(configPath)) { + LOGGER.info("Loading config from \"ray.conf\" file in classpath."); + config = config.withFallback(ConfigFactory.load(CUSTOM_CONFIG_FILE)); + } else { + LOGGER.info("Loading config from " + configPath + "."); + config = config.withFallback(ConfigFactory.parseFile(new File(configPath))); + } + config = config.withFallback(ConfigFactory.load(DEFAULT_CONFIG_FILE)); return new RayConfig(config); } diff --git a/java/runtime/src/main/java/org/ray/runtime/functionmanager/FunctionManager.java b/java/runtime/src/main/java/org/ray/runtime/functionmanager/FunctionManager.java index e586741641ae0..d7698c22aa7fb 100644 --- a/java/runtime/src/main/java/org/ray/runtime/functionmanager/FunctionManager.java +++ b/java/runtime/src/main/java/org/ray/runtime/functionmanager/FunctionManager.java @@ -15,20 +15,25 @@ import org.objectweb.asm.Type; import org.ray.api.function.RayFunc; import org.ray.api.id.UniqueId; +import org.ray.runtime.util.JarLoader; import org.ray.runtime.util.LambdaUtils; +import org.slf4j.Logger; +import org.slf4j.LoggerFactory; /** * Manages functions by driver id. */ public class FunctionManager { + private static final Logger LOGGER = LoggerFactory.getLogger(FunctionManager.class); + static final String CONSTRUCTOR_NAME = ""; /** * Cache from a RayFunc object to its corresponding FunctionDescriptor. Because * `LambdaUtils.getSerializedLambda` is expensive. */ - private static final ThreadLocal, FunctionDescriptor>> + private static final ThreadLocal, FunctionDescriptor>> RAY_FUNC_CACHE = ThreadLocal.withInitial(WeakHashMap::new); /** @@ -36,6 +41,21 @@ public class FunctionManager { */ private Map driverFunctionTables = new HashMap<>(); + /** + * The resource path which we can load the driver's jar resources. + */ + private String driverResourcePath; + + /** + * Construct a FunctionManager with the specified driver resource path. 
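Note: combined with the RayConfig changes above, a driver can now load configuration from an explicit file by starting the JVM with -Dray.config=/path/to/ray.conf instead of relying on a ray.conf on the classpath. When ray.driver.resource-path is also set, workers resolve a driver's jars from a subdirectory of that path named after the driver id, using the per-driver class loader built by this FunctionManager (the paths here are placeholders, not part of the patch).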
+ * + * @param driverResourcePath The specified driver resource that + * can store the driver's resources. + */ + public FunctionManager(String driverResourcePath) { + this.driverResourcePath = driverResourcePath; + } + /** * Get the RayFunction from a RayFunc instance (a lambda). * @@ -51,6 +71,7 @@ public RayFunction getFunction(UniqueId driverId, RayFunc func) { final String methodName = serializedLambda.getImplMethodName(); final String typeDescriptor = serializedLambda.getImplMethodSignature(); functionDescriptor = new FunctionDescriptor(className, methodName, typeDescriptor); + RAY_FUNC_CACHE.get().put(func.getClass(),functionDescriptor); } return getFunction(driverId, functionDescriptor); } @@ -65,8 +86,17 @@ public RayFunction getFunction(UniqueId driverId, RayFunc func) { public RayFunction getFunction(UniqueId driverId, FunctionDescriptor functionDescriptor) { DriverFunctionTable driverFunctionTable = driverFunctionTables.get(driverId); if (driverFunctionTable == null) { - //TODO(hchen): distinguish class loader by driver id. - ClassLoader classLoader = getClass().getClassLoader(); + String resourcePath = driverResourcePath + "/" + driverId.toString() + "/"; + ClassLoader classLoader; + + if (driverResourcePath != null && !driverResourcePath.isEmpty()) { + classLoader = JarLoader.loadJars(resourcePath, false); + LOGGER.info("Succeeded to load driver({}) resource. Resource path is {}", + driverId, resourcePath); + } else { + classLoader = getClass().getClassLoader(); + } + driverFunctionTable = new DriverFunctionTable(classLoader); driverFunctionTables.put(driverId, driverFunctionTable); } diff --git a/java/runtime/src/main/java/org/ray/runtime/functionmanager/RayFunction.java b/java/runtime/src/main/java/org/ray/runtime/functionmanager/RayFunction.java index 3d0704c6bf484..2f39ec3dc8db4 100644 --- a/java/runtime/src/main/java/org/ray/runtime/functionmanager/RayFunction.java +++ b/java/runtime/src/main/java/org/ray/runtime/functionmanager/RayFunction.java @@ -58,12 +58,17 @@ public FunctionDescriptor getFunctionDescriptor() { } public RayRemote getRayRemoteAnnotation() { - RayRemote rayRemote = executable.getAnnotation(RayRemote.class); - if (rayRemote == null) { - // If the method doesn't have a annotation, get the annotation from - // its wrapping class. + RayRemote rayRemote; + + // If this method is a constructor, the task of it should be a actorCreationTask. + // And the annotation of actorCreationTask should inherit from class. + // Otherwise, it's a normal method, and it shouldn't inherit annotation from class. 
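In other words, after this change the class-level @RayRemote annotation is consulted only for actor-creation (constructor) tasks; a regular method no longer falls back to it. A short illustration (the Echo class below is hypothetical):

    import org.ray.api.annotation.RayRemote;

    // Class-level annotation: applies when the constructor runs as an
    // actor-creation task.
    @RayRemote
    public class Echo {

      // A method now needs its own annotation; without it,
      // getRayRemoteAnnotation() returns null for this method instead of
      // inheriting the class-level annotation.
      @RayRemote
      public String echo(String message) {
        return message;
      }
    }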
+ if (isConstructor()) { rayRemote = executable.getDeclaringClass().getAnnotation(RayRemote.class); + } else { + rayRemote = executable.getAnnotation(RayRemote.class); } + return rayRemote; } diff --git a/java/runtime/src/main/java/org/ray/runtime/generated/TaskLanguage.java b/java/runtime/src/main/java/org/ray/runtime/generated/Language.java similarity index 51% rename from java/runtime/src/main/java/org/ray/runtime/generated/TaskLanguage.java rename to java/runtime/src/main/java/org/ray/runtime/generated/Language.java index e5e53614aa8a7..34604374dd441 100644 --- a/java/runtime/src/main/java/org/ray/runtime/generated/TaskLanguage.java +++ b/java/runtime/src/main/java/org/ray/runtime/generated/Language.java @@ -2,13 +2,13 @@ package org.ray.runtime.generated; -public final class TaskLanguage { - private TaskLanguage() { } +public final class Language { + private Language() { } public static final int PYTHON = 0; - public static final int JAVA = 1; + public static final int CPP = 1; + public static final int JAVA = 2; - public static final String[] names = { "PYTHON", "JAVA", }; + public static final String[] names = { "PYTHON", "CPP", "JAVA", }; public static String name(int e) { return names[e]; } } - diff --git a/java/runtime/src/main/java/org/ray/runtime/generated/TaskInfo.java b/java/runtime/src/main/java/org/ray/runtime/generated/TaskInfo.java index 8c0512afbc4fc..01113096036fc 100644 --- a/java/runtime/src/main/java/org/ray/runtime/generated/TaskInfo.java +++ b/java/runtime/src/main/java/org/ray/runtime/generated/TaskInfo.java @@ -48,9 +48,12 @@ public final class TaskInfo extends Table { public ResourcePair requiredResources(int j) { return requiredResources(new ResourcePair(), j); } public ResourcePair requiredResources(ResourcePair obj, int j) { int o = __offset(30); return o != 0 ? obj.__assign(__indirect(__vector(o) + j * 4), bb) : null; } public int requiredResourcesLength() { int o = __offset(30); return o != 0 ? __vector_len(o) : 0; } - public int language() { int o = __offset(32); return o != 0 ? bb.getInt(o + bb_pos) : 0; } - public String functionDescriptor(int j) { int o = __offset(34); return o != 0 ? __string(__vector(o) + j * 4) : null; } - public int functionDescriptorLength() { int o = __offset(34); return o != 0 ? __vector_len(o) : 0; } + public ResourcePair requiredPlacementResources(int j) { return requiredPlacementResources(new ResourcePair(), j); } + public ResourcePair requiredPlacementResources(ResourcePair obj, int j) { int o = __offset(32); return o != 0 ? obj.__assign(__indirect(__vector(o) + j * 4), bb) : null; } + public int requiredPlacementResourcesLength() { int o = __offset(32); return o != 0 ? __vector_len(o) : 0; } + public int language() { int o = __offset(34); return o != 0 ? bb.getInt(o + bb_pos) : 0; } + public String functionDescriptor(int j) { int o = __offset(36); return o != 0 ? __string(__vector(o) + j * 4) : null; } + public int functionDescriptorLength() { int o = __offset(36); return o != 0 ? 
__vector_len(o) : 0; } public static int createTaskInfo(FlatBufferBuilder builder, int driver_idOffset, @@ -67,11 +70,13 @@ public static int createTaskInfo(FlatBufferBuilder builder, int argsOffset, int returnsOffset, int required_resourcesOffset, + int required_placement_resourcesOffset, int language, int function_descriptorOffset) { - builder.startObject(16); + builder.startObject(17); TaskInfo.addFunctionDescriptor(builder, function_descriptorOffset); TaskInfo.addLanguage(builder, language); + TaskInfo.addRequiredPlacementResources(builder, required_placement_resourcesOffset); TaskInfo.addRequiredResources(builder, required_resourcesOffset); TaskInfo.addReturns(builder, returnsOffset); TaskInfo.addArgs(builder, argsOffset); @@ -89,7 +94,7 @@ public static int createTaskInfo(FlatBufferBuilder builder, return TaskInfo.endTaskInfo(builder); } - public static void startTaskInfo(FlatBufferBuilder builder) { builder.startObject(16); } + public static void startTaskInfo(FlatBufferBuilder builder) { builder.startObject(17); } public static void addDriverId(FlatBufferBuilder builder, int driverIdOffset) { builder.addOffset(0, driverIdOffset, 0); } public static void addTaskId(FlatBufferBuilder builder, int taskIdOffset) { builder.addOffset(1, taskIdOffset, 0); } public static void addParentTaskId(FlatBufferBuilder builder, int parentTaskIdOffset) { builder.addOffset(2, parentTaskIdOffset, 0); } @@ -110,8 +115,11 @@ public static int createTaskInfo(FlatBufferBuilder builder, public static void addRequiredResources(FlatBufferBuilder builder, int requiredResourcesOffset) { builder.addOffset(13, requiredResourcesOffset, 0); } public static int createRequiredResourcesVector(FlatBufferBuilder builder, int[] data) { builder.startVector(4, data.length, 4); for (int i = data.length - 1; i >= 0; i--) builder.addOffset(data[i]); return builder.endVector(); } public static void startRequiredResourcesVector(FlatBufferBuilder builder, int numElems) { builder.startVector(4, numElems, 4); } - public static void addLanguage(FlatBufferBuilder builder, int language) { builder.addInt(14, language, 0); } - public static void addFunctionDescriptor(FlatBufferBuilder builder, int functionDescriptorOffset) { builder.addOffset(15, functionDescriptorOffset, 0); } + public static void addRequiredPlacementResources(FlatBufferBuilder builder, int requiredPlacementResourcesOffset) { builder.addOffset(14, requiredPlacementResourcesOffset, 0); } + public static int createRequiredPlacementResourcesVector(FlatBufferBuilder builder, int[] data) { builder.startVector(4, data.length, 4); for (int i = data.length - 1; i >= 0; i--) builder.addOffset(data[i]); return builder.endVector(); } + public static void startRequiredPlacementResourcesVector(FlatBufferBuilder builder, int numElems) { builder.startVector(4, numElems, 4); } + public static void addLanguage(FlatBufferBuilder builder, int language) { builder.addInt(15, language, 0); } + public static void addFunctionDescriptor(FlatBufferBuilder builder, int functionDescriptorOffset) { builder.addOffset(16, functionDescriptorOffset, 0); } public static int createFunctionDescriptorVector(FlatBufferBuilder builder, int[] data) { builder.startVector(4, data.length, 4); for (int i = data.length - 1; i >= 0; i--) builder.addOffset(data[i]); return builder.endVector(); } public static void startFunctionDescriptorVector(FlatBufferBuilder builder, int numElems) { builder.startVector(4, numElems, 4); } public static int endTaskInfo(FlatBufferBuilder builder) { @@ -136,4 +144,3 @@ public 
ByteBuffer returnsAsByteBuffer(int j) { return src; } } - diff --git a/java/runtime/src/main/java/org/ray/runtime/objectstore/ObjectStoreProxy.java b/java/runtime/src/main/java/org/ray/runtime/objectstore/ObjectStoreProxy.java index b497f5c44b148..5f8221ff6f028 100644 --- a/java/runtime/src/main/java/org/ray/runtime/objectstore/ObjectStoreProxy.java +++ b/java/runtime/src/main/java/org/ray/runtime/objectstore/ObjectStoreProxy.java @@ -4,10 +4,11 @@ import java.util.List; import org.apache.arrow.plasma.ObjectStoreLink; import org.apache.commons.lang3.tuple.Pair; +import org.ray.api.exception.RayException; import org.ray.api.id.UniqueId; import org.ray.runtime.AbstractRayRuntime; import org.ray.runtime.util.Serializer; -import org.ray.runtime.util.exception.TaskExecutionException; +import org.ray.runtime.util.UniqueIdUtil; /** * Object store proxy, which handles serialization and deserialization, and utilize a {@code @@ -15,9 +16,10 @@ */ public class ObjectStoreProxy { + private static final int GET_TIMEOUT_MS = 1000; + private final AbstractRayRuntime runtime; private final ObjectStoreLink store; - private final int getTimeoutMs = 1000; public ObjectStoreProxy(AbstractRayRuntime runtime, ObjectStoreLink store) { this.runtime = runtime; @@ -25,18 +27,18 @@ public ObjectStoreProxy(AbstractRayRuntime runtime, ObjectStoreLink store) { } public Pair get(UniqueId objectId, boolean isMetadata) - throws TaskExecutionException { - return get(objectId, getTimeoutMs, isMetadata); + throws RayException { + return get(objectId, GET_TIMEOUT_MS, isMetadata); } public Pair get(UniqueId id, int timeoutMs, boolean isMetadata) - throws TaskExecutionException { + throws RayException { byte[] obj = store.get(id.getBytes(), timeoutMs, isMetadata); if (obj != null) { T t = Serializer.decode(obj, runtime.getWorkerContext().getCurrentClassLoader()); store.release(id.getBytes()); - if (t instanceof TaskExecutionException) { - throw (TaskExecutionException) t; + if (t instanceof RayException) { + throw (RayException) t; } return Pair.of(t, GetStatus.SUCCESS); } else { @@ -45,21 +47,21 @@ public Pair get(UniqueId id, int timeoutMs, boolean isMetadata } public List> get(List objectIds, boolean isMetadata) - throws TaskExecutionException { - return get(objectIds, getTimeoutMs, isMetadata); + throws RayException { + return get(objectIds, GET_TIMEOUT_MS, isMetadata); } public List> get(List ids, int timeoutMs, boolean isMetadata) - throws TaskExecutionException { - List objs = store.get(getIdBytes(ids), timeoutMs, isMetadata); + throws RayException { + List objs = store.get(UniqueIdUtil.getIdBytes(ids), timeoutMs, isMetadata); List> ret = new ArrayList<>(); for (int i = 0; i < objs.size(); i++) { byte[] obj = objs.get(i); if (obj != null) { T t = Serializer.decode(obj, runtime.getWorkerContext().getCurrentClassLoader()); store.release(ids.get(i).getBytes()); - if (t instanceof TaskExecutionException) { - throw (TaskExecutionException) t; + if (t instanceof RayException) { + throw (RayException) t; } ret.add(Pair.of(t, GetStatus.SUCCESS)); } else { @@ -69,15 +71,6 @@ public List> get(List ids, int timeoutMs, boole return ret; } - private static byte[][] getIdBytes(List objectIds) { - int size = objectIds.size(); - byte[][] ids = new byte[size][]; - for (int i = 0; i < size; i++) { - ids[i] = objectIds.get(i).getBytes(); - } - return ids; - } - public void put(UniqueId id, Object obj, Object metadata) { store.put(id.getBytes(), Serializer.encode(obj), Serializer.encode(metadata)); } diff --git 
a/java/runtime/src/main/java/org/ray/runtime/raylet/MockRayletClient.java b/java/runtime/src/main/java/org/ray/runtime/raylet/MockRayletClient.java index 95a8abdf4274d..dbe2cd3b6329b 100644 --- a/java/runtime/src/main/java/org/ray/runtime/raylet/MockRayletClient.java +++ b/java/runtime/src/main/java/org/ray/runtime/raylet/MockRayletClient.java @@ -6,6 +6,7 @@ import java.util.concurrent.ConcurrentHashMap; import org.ray.api.RayObject; import org.ray.api.WaitResult; +import org.ray.api.exception.RayException; import org.ray.api.id.UniqueId; import org.ray.runtime.RayDevRuntime; import org.ray.runtime.objectstore.MockObjectStore; @@ -66,12 +67,13 @@ public TaskSpec getTask() { } @Override - public void reconstructObjects(List objectIds, boolean fetchOnly) { + public void fetchOrReconstruct(List objectIds, boolean fetchOnly, + UniqueId currentTaskId) throws RayException { } @Override - public void notifyUnblocked() { + public void notifyUnblocked(UniqueId currentTaskId) { } @@ -81,7 +83,8 @@ public UniqueId generateTaskId(UniqueId driverId, UniqueId parentTaskId, int tas } @Override - public WaitResult wait(List> waitFor, int numReturns, int timeoutMs) { + public WaitResult wait(List> waitFor, int numReturns, int + timeoutMs, UniqueId currentTaskId) { return new WaitResult( waitFor, ImmutableList.of() diff --git a/java/runtime/src/main/java/org/ray/runtime/raylet/RayletClient.java b/java/runtime/src/main/java/org/ray/runtime/raylet/RayletClient.java index baa32a1425334..3e3f4f1e72918 100644 --- a/java/runtime/src/main/java/org/ray/runtime/raylet/RayletClient.java +++ b/java/runtime/src/main/java/org/ray/runtime/raylet/RayletClient.java @@ -3,6 +3,7 @@ import java.util.List; import org.ray.api.RayObject; import org.ray.api.WaitResult; +import org.ray.api.exception.RayException; import org.ray.api.id.UniqueId; import org.ray.runtime.task.TaskSpec; @@ -15,13 +16,15 @@ public interface RayletClient { TaskSpec getTask(); - void reconstructObjects(List objectIds, boolean fetchOnly); + void fetchOrReconstruct(List objectIds, boolean fetchOnly, UniqueId currentTaskId) + throws RayException; - void notifyUnblocked(); + void notifyUnblocked(UniqueId currentTaskId); UniqueId generateTaskId(UniqueId driverId, UniqueId parentTaskId, int taskIndex); - WaitResult wait(List> waitFor, int numReturns, int timeoutMs); + WaitResult wait(List> waitFor, int numReturns, int + timeoutMs, UniqueId currentTaskId); void freePlasmaObjects(List objectIds, boolean localOnly); } diff --git a/java/runtime/src/main/java/org/ray/runtime/raylet/RayletClientImpl.java b/java/runtime/src/main/java/org/ray/runtime/raylet/RayletClientImpl.java index 1a78f22debec9..cd4f3fd313c6d 100644 --- a/java/runtime/src/main/java/org/ray/runtime/raylet/RayletClientImpl.java +++ b/java/runtime/src/main/java/org/ray/runtime/raylet/RayletClientImpl.java @@ -10,15 +10,16 @@ import java.util.Map; import org.ray.api.RayObject; import org.ray.api.WaitResult; +import org.ray.api.exception.RayException; import org.ray.api.id.UniqueId; import org.ray.runtime.functionmanager.FunctionDescriptor; import org.ray.runtime.generated.Arg; +import org.ray.runtime.generated.Language; import org.ray.runtime.generated.ResourcePair; import org.ray.runtime.generated.TaskInfo; -import org.ray.runtime.generated.TaskLanguage; import org.ray.runtime.task.FunctionArg; import org.ray.runtime.task.TaskSpec; -import org.ray.runtime.util.UniqueIdHelper; +import org.ray.runtime.util.UniqueIdUtil; import org.ray.runtime.util.logger.RayLog; public class RayletClientImpl 
implements RayletClient { @@ -44,13 +45,15 @@ public RayletClientImpl(String schedulerSockName, UniqueId clientId, } @Override - public WaitResult wait(List> waitFor, int numReturns, int timeoutMs) { + public WaitResult wait(List> waitFor, int numReturns, int + timeoutMs, UniqueId currentTaskId) { List ids = new ArrayList<>(); for (RayObject element : waitFor) { ids.add(element.getId()); } - boolean[] ready = nativeWaitObject(client, getIdBytes(ids), numReturns, timeoutMs, false); + boolean[] ready = nativeWaitObject(client, UniqueIdUtil.getIdBytes(ids), + numReturns, timeoutMs, false, currentTaskId.getBytes()); List> readyList = new ArrayList<>(); List> unreadyList = new ArrayList<>(); @@ -86,12 +89,17 @@ public TaskSpec getTask() { } @Override - public void reconstructObjects(List objectIds, boolean fetchOnly) { - if (RayLog.core.isInfoEnabled()) { - RayLog.core.info("Reconstructing objects for task {}, object IDs are {}", - UniqueIdHelper.computeTaskId(objectIds.get(0)), objectIds); + public void fetchOrReconstruct(List objectIds, boolean fetchOnly, + UniqueId currentTaskId) throws RayException { + if (RayLog.core.isDebugEnabled()) { + RayLog.core.debug("Blocked on objects for task {}, object IDs are {}", + UniqueIdUtil.computeTaskId(objectIds.get(0)), objectIds); + } + int ret = nativeFetchOrReconstruct(client, UniqueIdUtil.getIdBytes(objectIds), + fetchOnly, currentTaskId.getBytes()); + if (ret != 0) { + throw new RayException("Connection closed by Raylet"); } - nativeReconstructObjects(client, getIdBytes(objectIds), fetchOnly); } @Override @@ -101,13 +109,13 @@ public UniqueId generateTaskId(UniqueId driverId, UniqueId parentTaskId, int tas } @Override - public void notifyUnblocked() { - nativeNotifyUnblocked(client); + public void notifyUnblocked(UniqueId currentTaskId) { + nativeNotifyUnblocked(client, currentTaskId.getBytes()); } @Override public void freePlasmaObjects(List objectIds, boolean localOnly) { - byte[][] objectIdsArray = getIdBytes(objectIds); + byte[][] objectIdsArray = UniqueIdUtil.getIdBytes(objectIds); nativeFreePlasmaObjects(client, objectIdsArray, localOnly); } @@ -168,7 +176,7 @@ private static ByteBuffer convertTaskSpecToFlatbuffer(TaskSpec task) { final int parentTaskIdOffset = fbb.createString(task.parentTaskId.toByteBuffer()); final int parentCounter = task.parentCounter; final int actorCreateIdOffset = fbb.createString(task.actorCreationId.toByteBuffer()); - final int actorCreateDummyIdOffset = fbb.createString(UniqueId.NIL.toByteBuffer()); + final int actorCreateDummyIdOffset = fbb.createString(task.actorId.toByteBuffer()); final int actorIdOffset = fbb.createString(task.actorId.toByteBuffer()); final int actorHandleIdOffset = fbb.createString(task.actorHandleId.toByteBuffer()); final int actorCounter = task.actorCounter; @@ -209,6 +217,11 @@ private static ByteBuffer convertTaskSpecToFlatbuffer(TaskSpec task) { ResourcePair.createResourcePair(fbb, keyOffset, entry.getValue()); } int requiredResourcesOffset = fbb.createVectorOfTables(requiredResourcesOffsets); + + int[] requiredPlacementResourcesOffsets = new int[0]; + int requiredPlacementResourcesOffset = + fbb.createVectorOfTables(requiredPlacementResourcesOffsets); + int[] functionDescriptorOffsets = new int[]{ fbb.createString(task.functionDescriptor.className), fbb.createString(task.functionDescriptor.name), @@ -222,7 +235,8 @@ private static ByteBuffer convertTaskSpecToFlatbuffer(TaskSpec task) { actorCreateIdOffset, actorCreateDummyIdOffset, actorIdOffset, actorHandleIdOffset, actorCounter, false, 
functionIdOffset, - argsOffset, returnsOffset, requiredResourcesOffset, TaskLanguage.JAVA, + argsOffset, returnsOffset, requiredResourcesOffset, + requiredPlacementResourcesOffset, Language.JAVA, functionDescriptorOffset); fbb.finish(root); ByteBuffer buffer = fbb.dataBuffer(); @@ -236,15 +250,6 @@ private static ByteBuffer convertTaskSpecToFlatbuffer(TaskSpec task) { return buffer; } - private static byte[][] getIdBytes(List objectIds) { - int size = objectIds.size(); - byte[][] ids = new byte[size][]; - for (int i = 0; i < size; i++) { - ids[i] = objectIds.get(i).getBytes(); - } - return ids; - } - public void destroy() { nativeDestroy(client); } @@ -258,8 +263,8 @@ public void destroy() { /// 1) pushd $Dir/java/runtime/target/classes /// 2) javah -classpath .:$Dir/java/api/target/classes org.ray.runtime.raylet.RayletClientImpl /// 3) clang-format -i org_ray_runtime_raylet_RayletClientImpl.h - /// 4) cp org_ray_runtime_raylet_RayletClientImpl.h $Dir/src/local_scheduler/lib/java/ - /// 5) vim $Dir/src/local_scheduler/lib/java/org_ray_runtime_raylet_RayletClientImpl.cc + /// 4) cp org_ray_runtime_raylet_RayletClientImpl.h $Dir/src/ray/raylet/lib/java/ + /// 5) vim $Dir/src/ray/raylet/lib/java/org_ray_runtime_raylet_RayletClientImpl.cc /// 6) popd private static native long nativeInit(String localSchedulerSocket, byte[] workerId, @@ -273,15 +278,15 @@ private static native void nativeSubmitTask(long client, byte[] cursorId, ByteBu private static native void nativeDestroy(long client); - private static native void nativeReconstructObjects(long client, byte[][] objectIds, - boolean fetchOnly); + private static native int nativeFetchOrReconstruct(long client, byte[][] objectIds, + boolean fetchOnly, byte[] currentTaskId); - private static native void nativeNotifyUnblocked(long client); + private static native void nativeNotifyUnblocked(long client, byte[] currentTaskId); private static native void nativePutObject(long client, byte[] taskId, byte[] objectId); private static native boolean[] nativeWaitObject(long conn, byte[][] objectIds, - int numReturns, int timeout, boolean waitLocal); + int numReturns, int timeout, boolean waitLocal, byte[] currentTaskId); private static native byte[] nativeGenerateTaskId(byte[] driverId, byte[] parentTaskId, int taskIndex); diff --git a/java/runtime/src/main/java/org/ray/runtime/runner/RunManager.java b/java/runtime/src/main/java/org/ray/runtime/runner/RunManager.java index 03429c963a3a5..56940e33cbcfd 100644 --- a/java/runtime/src/main/java/org/ray/runtime/runner/RunManager.java +++ b/java/runtime/src/main/java/org/ray/runtime/runner/RunManager.java @@ -179,13 +179,16 @@ private void startRaylet() { rayConfig.rayletExecutablePath, rayConfig.rayletSocketName, rayConfig.objectStoreSocketName, + "0", // The object manager port. + "0", // The node manager port. rayConfig.nodeIp, rayConfig.getRedisIp(), rayConfig.getRedisPort().toString(), "0", // number of initial workers String.valueOf(maximumStartupConcurrency), ResourceUtil.getResourcesStringFromMap(rayConfig.resources), - "", // python worker command + "", // The internal config list. + buildPythonWorkerCommand(), // python worker command buildWorkerCommandRaylet() // java worker command ); @@ -205,8 +208,8 @@ private String buildWorkerCommandRaylet() { // Generate classpath based on current classpath + user-defined classpath. 
String classpath = concatPath(Stream.concat( - Stream.of(System.getProperty("java.class.path").split(":")), - rayConfig.classpath.stream() + rayConfig.classpath.stream(), + Stream.of(System.getProperty("java.class.path").split(":")) )); cmd.add(classpath); @@ -227,6 +230,8 @@ private String buildWorkerCommandRaylet() { // Config overwrite cmd.add("-Dray.redis.address=" + rayConfig.getRedisAddress()); + cmd.addAll(rayConfig.jvmParameters); + // Main class cmd.add(WORKER_CLASS); String command = Joiner.on(" ").join(cmd); @@ -245,4 +250,22 @@ private void startObjectStore() { startProcess(command, null, "plasma_store"); } + private String buildPythonWorkerCommand() { + // disable python worker start from raylet, which starts from java + if (rayConfig.pythonWorkerCommand == null) { + return ""; + } + + List cmd = new ArrayList<>(); + cmd.add(rayConfig.pythonWorkerCommand); + cmd.add("--node-ip-address=" + rayConfig.nodeIp); + cmd.add("--object-store-name=" + rayConfig.objectStoreSocketName); + cmd.add("--raylet-name=" + rayConfig.rayletSocketName); + cmd.add("--redis-address=" + rayConfig.getRedisAddress()); + + String command = cmd.stream().collect(Collectors.joining(" ")); + LOGGER.debug("python worker command: {}", command); + return command; + } + } diff --git a/java/runtime/src/main/java/org/ray/runtime/util/JarLoader.java b/java/runtime/src/main/java/org/ray/runtime/util/JarLoader.java index 8a66923e3464a..c6ab5650c038f 100644 --- a/java/runtime/src/main/java/org/ray/runtime/util/JarLoader.java +++ b/java/runtime/src/main/java/org/ray/runtime/util/JarLoader.java @@ -14,13 +14,16 @@ import org.apache.commons.io.IOUtils; import org.apache.commons.io.filefilter.DirectoryFileFilter; import org.apache.commons.io.filefilter.RegexFileFilter; -import org.ray.runtime.util.logger.RayLog; +import org.slf4j.Logger; +import org.slf4j.LoggerFactory; /** * load and unload jars from a dir. */ public class JarLoader { + private static final Logger LOGGER = LoggerFactory.getLogger(JarLoader.class); + public static URLClassLoader loadJars(String dir, boolean explicitLoad) { // get all jars Collection jars = FileUtils.listFiles( @@ -42,7 +45,7 @@ private static URLClassLoader loadJar(Collection appJars, boolean explicit for (File appJar : appJars) { try { - RayLog.core.info("load jar " + appJar.getAbsolutePath()); + LOGGER.info("succeeded to load jar {}.", appJar.getAbsolutePath()); JarFile jar = new JarFile(appJar.getAbsolutePath()); jars.add(jar); urls.add(appJar.toURI().toURL()); diff --git a/java/runtime/src/main/java/org/ray/runtime/util/ResourceUtil.java b/java/runtime/src/main/java/org/ray/runtime/util/ResourceUtil.java index 98cc436312423..4863ca5d13c1d 100644 --- a/java/runtime/src/main/java/org/ray/runtime/util/ResourceUtil.java +++ b/java/runtime/src/main/java/org/ray/runtime/util/ResourceUtil.java @@ -2,59 +2,11 @@ import java.util.HashMap; import java.util.Map; -import org.ray.api.annotation.RayRemote; -import org.ray.api.annotation.ResourceItem; public class ResourceUtil { public static final String CPU_LITERAL = "CPU"; public static final String GPU_LITERAL = "GPU"; - /** - * Convert the array that contains resource items to a map. - * - * @param remoteAnnotation The RayRemote annotation that contains the resource items. - * @return The map whose key represents the resource name - * and the value represents the resource quantity. 
- */ - public static Map getResourcesMapFromArray(RayRemote remoteAnnotation) { - Map resourceMap = new HashMap<>(); - if (remoteAnnotation != null) { - for (ResourceItem item : remoteAnnotation.resources()) { - if (!item.name().isEmpty()) { - resourceMap.put(item.name(), item.value()); - } - } - } - if (!resourceMap.containsKey(CPU_LITERAL)) { - resourceMap.put(CPU_LITERAL, 0.0); - } - return resourceMap; - } - - /** - * Convert the resources map to a format string. - * - * @param resources The resource map to be Converted. - * @return The format resources string, like "{CPU:4, GPU:0}". - */ - public static String getResourcesFromatStringFromMap(Map resources) { - if (resources == null) { - return "{}"; - } - StringBuilder builder = new StringBuilder(); - builder.append("{"); - int count = 1; - for (Map.Entry entry : resources.entrySet()) { - builder.append(entry.getKey()).append(":").append(entry.getValue()); - count++; - if (count != resources.size()) { - builder.append(", "); - } - } - builder.append("}"); - return builder.toString(); - } - /** * Convert resources map to a string that is used * for the command line argument of starting raylet. @@ -99,7 +51,7 @@ public static Map getResourcesMapFromString(String resources) String[] resourcePair = trimItem.split(":"); if (resourcePair.length != 2) { - throw new IllegalArgumentException("Format of static resurces configure is invalid."); + throw new IllegalArgumentException("Format of static resources configure is invalid."); } final String resourceName = resourcePair[0].trim(); diff --git a/java/runtime/src/main/java/org/ray/runtime/util/UniqueIdHelper.java b/java/runtime/src/main/java/org/ray/runtime/util/UniqueIdUtil.java similarity index 81% rename from java/runtime/src/main/java/org/ray/runtime/util/UniqueIdHelper.java rename to java/runtime/src/main/java/org/ray/runtime/util/UniqueIdUtil.java index 52d9a7359247a..d7b347945792c 100644 --- a/java/runtime/src/main/java/org/ray/runtime/util/UniqueIdHelper.java +++ b/java/runtime/src/main/java/org/ray/runtime/util/UniqueIdUtil.java @@ -3,6 +3,8 @@ import java.nio.ByteBuffer; import java.nio.ByteOrder; import java.util.Arrays; +import java.util.List; + import org.ray.api.id.UniqueId; @@ -11,7 +13,7 @@ * Note: any changes to these methods must be synced with C++ helper functions * in src/ray/id.h */ -public class UniqueIdHelper { +public class UniqueIdUtil { public static final int OBJECT_INDEX_POS = 0; public static final int OBJECT_INDEX_LENGTH = 4; @@ -37,7 +39,7 @@ private static UniqueId computeObjectId(UniqueId taskId, int index) { System.arraycopy(taskId.getBytes(),0, objId, 0, UniqueId.LENGTH); ByteBuffer wbb = ByteBuffer.wrap(objId); wbb.order(ByteOrder.LITTLE_ENDIAN); - wbb.putInt(UniqueIdHelper.OBJECT_INDEX_POS, index); + wbb.putInt(UniqueIdUtil.OBJECT_INDEX_POS, index); return new UniqueId(objId); } @@ -63,9 +65,18 @@ public static UniqueId computePutId(UniqueId taskId, int putIndex) { public static UniqueId computeTaskId(UniqueId objectId) { byte[] taskId = new byte[UniqueId.LENGTH]; System.arraycopy(objectId.getBytes(), 0, taskId, 0, UniqueId.LENGTH); - Arrays.fill(taskId, UniqueIdHelper.OBJECT_INDEX_POS, - UniqueIdHelper.OBJECT_INDEX_POS + UniqueIdHelper.OBJECT_INDEX_LENGTH, (byte) 0); + Arrays.fill(taskId, UniqueIdUtil.OBJECT_INDEX_POS, + UniqueIdUtil.OBJECT_INDEX_POS + UniqueIdUtil.OBJECT_INDEX_LENGTH, (byte) 0); return new UniqueId(taskId); } + + public static byte[][] getIdBytes(List objectIds) { + int size = objectIds.size(); + byte[][] ids = new byte[size][]; + for 
(int i = 0; i < size; i++) { + ids[i] = objectIds.get(i).getBytes(); + } + return ids; + } } diff --git a/java/runtime/src/main/java/org/ray/runtime/util/exception/TaskExecutionException.java b/java/runtime/src/main/java/org/ray/runtime/util/exception/TaskExecutionException.java deleted file mode 100644 index 99bc0912e1d07..0000000000000 --- a/java/runtime/src/main/java/org/ray/runtime/util/exception/TaskExecutionException.java +++ /dev/null @@ -1,15 +0,0 @@ -package org.ray.runtime.util.exception; - -/** - * An exception which is thrown when a ray task encounters an error when executing. - */ -public class TaskExecutionException extends RuntimeException { - - public TaskExecutionException(Throwable cause) { - super(cause); - } - - public TaskExecutionException(String message, Throwable cause) { - super(message, cause); - } -} diff --git a/java/runtime/src/main/java/org/ray/runtime/util/generator/RayCallGenerator.java b/java/runtime/src/main/java/org/ray/runtime/util/generator/RayCallGenerator.java index 10ffc3488f287..82fdf6b7f99e1 100644 --- a/java/runtime/src/main/java/org/ray/runtime/util/generator/RayCallGenerator.java +++ b/java/runtime/src/main/java/org/ray/runtime/util/generator/RayCallGenerator.java @@ -21,7 +21,17 @@ private String build() { newLine(""); newLine("package org.ray.api;"); newLine(""); - newLine("import org.ray.api.function.*;"); + newLine("import org.ray.api.function.RayFunc;"); + newLine("import org.ray.api.function.RayFunc0;"); + newLine("import org.ray.api.function.RayFunc1;"); + newLine("import org.ray.api.function.RayFunc2;"); + newLine("import org.ray.api.function.RayFunc3;"); + newLine("import org.ray.api.function.RayFunc4;"); + newLine("import org.ray.api.function.RayFunc5;"); + newLine("import org.ray.api.function.RayFunc6;"); + newLine("import org.ray.api.options.ActorCreationOptions;"); + newLine("import org.ray.api.options.BaseTaskOptions;"); + newLine("import org.ray.api.options.CallOptions;"); newLine(""); newLine("/**"); @@ -33,19 +43,21 @@ private String build() { newLine(1, "// Methods for remote function invocation."); newLine(1, "// ======================================="); for (int i = 0; i <= MAX_PARAMETERS; i++) { - buildCalls(i, false, false); + buildCalls(i, false, false, false); + buildCalls(i, false, false, true); } newLine(1, "// ==========================================="); newLine(1, "// Methods for remote actor method invocation."); newLine(1, "// ==========================================="); for (int i = 0; i <= MAX_PARAMETERS - 1; i++) { - buildCalls(i, true, false); + buildCalls(i, true, false, false); } newLine(1, "// ==========================="); newLine(1, "// Methods for actor creation."); newLine(1, "// ==========================="); for (int i = 0; i <= MAX_PARAMETERS; i++) { - buildCalls(i, false, true); + buildCalls(i, false, true, false); + buildCalls(i, false, true, true); } newLine("}"); return sb.toString(); @@ -57,7 +69,8 @@ private String build() { * @param forActor build actor api when true, otherwise build task api. * @param forActorCreation build `Ray.createActor` when true, otherwise build `Ray.call`. 
*/ - private void buildCalls(int numParameters, boolean forActor, boolean forActorCreation) { + private void buildCalls(int numParameters, boolean forActor, + boolean forActorCreation, boolean hasOptionsParam) { String genericTypes = ""; String argList = ""; for (int i = 0; i < numParameters; i++) { @@ -82,18 +95,36 @@ private void buildCalls(int numParameters, boolean forActor, boolean forActorCre paramPrefix += ", "; } + String optionsParam; + if (hasOptionsParam) { + optionsParam = forActorCreation ? ", ActorCreationOptions options" : ", CallOptions options"; + } else { + optionsParam = ""; + } + + String optionsArg; + if (forActor) { + optionsArg = ""; + } else { + if (hasOptionsParam) { + optionsArg = ", options"; + } else { + optionsArg = ", null"; + } + } + String returnType = !forActorCreation ? "RayObject" : "RayActor"; String funcName = !forActorCreation ? "call" : "createActor"; String funcArgs = !forActor ? "f, args" : "f, actor, args"; for (String param : generateParameters(0, numParameters)) { // method signature newLine(1, String.format( - "public static <%s> %s %s(%s) {", - genericTypes, returnType, funcName, paramPrefix + param + "public static <%s> %s %s(%s%s) {", + genericTypes, returnType, funcName, paramPrefix + param, optionsParam )); // method body newLine(2, String.format("Object[] args = new Object[]{%s};", argList)); - newLine(2, String.format("return Ray.internal().%s(%s);", funcName, funcArgs)); + newLine(2, String.format("return Ray.internal().%s(%s%s);", funcName, funcArgs, optionsArg)); newLine(1, "}"); } } diff --git a/java/runtime/src/main/resources/ray.default.conf b/java/runtime/src/main/resources/ray.default.conf index c20d679a9c598..b45d7dc6376d4 100644 --- a/java/runtime/src/main/resources/ray.default.conf +++ b/java/runtime/src/main/resources/ray.default.conf @@ -25,9 +25,16 @@ ray { // Available resources on this node, for example "CPU:4,GPU:0". resources: "" - // If worker.mode is DRIVER, specify the driver id. - // If not provided, a random id will be used. - driver.id: "" + // Configuration items about the driver. + driver { + // If worker.mode is DRIVER, specify the driver id. + // If not provided, a random id will be used. + id: "" + // If this config is set, the worker will use different paths to load resources when + // executing tasks from different drivers. E.g. if it's set to '/tmp/driver_resources', + // the path for driver 123 will be '/tmp/driver_resources/123'. + resource-path: "" + } // Root dir of log files. log-dir: /tmp/ray/logs @@ -36,6 +43,9 @@ ray { // Otherwise, output will be printed to console. redirect-output: true + // Custom worker jvm parameters. + worker.jvm-parameters: [] + // Custom `java.library.path` // Note, do not use `dir1:dir2` format, put each dir as a list item.
library.path: [] @@ -76,4 +86,5 @@ ray { // RPC socket name of Raylet socket-name: /tmp/ray/sockets/raylet } + } diff --git a/java/runtime/src/test/java/org/ray/runtime/functionmanager/FunctionManagerTest.java b/java/runtime/src/test/java/org/ray/runtime/functionmanager/FunctionManagerTest.java index 85f482544c84d..f5ff1e481a36e 100644 --- a/java/runtime/src/test/java/org/ray/runtime/functionmanager/FunctionManagerTest.java +++ b/java/runtime/src/test/java/org/ray/runtime/functionmanager/FunctionManagerTest.java @@ -1,5 +1,9 @@ package org.ray.runtime.functionmanager; +import java.io.File; +import java.nio.file.Files; +import java.nio.file.Paths; +import java.nio.file.StandardCopyOption; import java.util.Map; import org.apache.commons.lang3.tuple.ImmutablePair; import org.apache.commons.lang3.tuple.Pair; @@ -41,8 +45,6 @@ public Object bar() { private static FunctionDescriptor barDescriptor; private static FunctionDescriptor barConstructorDescriptor; - private FunctionManager functionManager; - @BeforeClass public static void beforeClass() { fooFunc = FunctionManagerTest::foo; @@ -57,13 +59,9 @@ public static void beforeClass() { "()V"); } - @Before - public void before() { - functionManager = new FunctionManager(); - } - @Test public void testGetFunctionFromRayFunc() { + final FunctionManager functionManager = new FunctionManager(null); // Test normal function. RayFunction func = functionManager.getFunction(UniqueId.NIL, fooFunc); Assert.assertFalse(func.isConstructor()); @@ -74,7 +72,7 @@ public void testGetFunctionFromRayFunc() { func = functionManager.getFunction(UniqueId.NIL, barFunc); Assert.assertFalse(func.isConstructor()); Assert.assertEquals(func.getFunctionDescriptor(), barDescriptor); - Assert.assertNotNull(func.getRayRemoteAnnotation()); + Assert.assertNull(func.getRayRemoteAnnotation()); // Test actor constructor func = functionManager.getFunction(UniqueId.NIL, barConstructor); @@ -85,6 +83,7 @@ public void testGetFunctionFromRayFunc() { @Test public void testGetFunctionFromFunctionDescriptor() { + final FunctionManager functionManager = new FunctionManager(null); // Test normal function. RayFunction func = functionManager.getFunction(UniqueId.NIL, fooDescriptor); Assert.assertFalse(func.isConstructor()); @@ -95,7 +94,7 @@ public void testGetFunctionFromFunctionDescriptor() { func = functionManager.getFunction(UniqueId.NIL, barDescriptor); Assert.assertFalse(func.isConstructor()); Assert.assertEquals(func.getFunctionDescriptor(), barDescriptor); - Assert.assertNotNull(func.getRayRemoteAnnotation()); + Assert.assertNull(func.getRayRemoteAnnotation()); // Test actor constructor func = functionManager.getFunction(UniqueId.NIL, barConstructorDescriptor); @@ -116,4 +115,28 @@ public void testLoadFunctionTableForClass() { Assert.assertTrue(res.containsKey( ImmutablePair.of(barConstructorDescriptor.name, barConstructorDescriptor.typeDescriptor))); } + + //TODO(qwang): This is an integration test case, and we should move it to test folder in the future. + @Test + public void testGetFunctionFromLocalResource() throws Exception{ + UniqueId driverId = UniqueId.fromHexString("0123456789012345678901234567890123456789"); + + //TODO(qwang): We should use a independent app demo instead of `tutorial`. 
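+    // This test copies the tutorial jar into <resource-path>/<driver-id>/ and then verifies
+    // that FunctionManager can resolve a function from that per-driver directory.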
+ final String resourcePath = "/tmp/ray/test/resource"; + final String srcJarPath = System.getProperty("user.dir") + + "/../tutorial/target/ray-tutorial-0.1-SNAPSHOT.jar"; + final String destJarPath = resourcePath + "/" + driverId.toString() + + "/ray-tutorial-0.1-SNAPSHOT.jar"; + + File file = new File(resourcePath + "/" + driverId.toString()); + file.mkdirs(); + Files.copy(Paths.get(srcJarPath), Paths.get(destJarPath), StandardCopyOption.REPLACE_EXISTING); + + final FunctionManager functionManager = new FunctionManager(resourcePath); + FunctionDescriptor sayHelloDescriptor = new FunctionDescriptor("org.ray.exercise.Exercise02", + "sayHello", "()Ljava/lang/String;"); + RayFunction func = functionManager.getFunction(driverId, sayHelloDescriptor); + Assert.assertEquals(func.getFunctionDescriptor(), sayHelloDescriptor); + } + } diff --git a/java/test/src/main/java/org/ray/api/test/RayConfigTest.java b/java/test/src/main/java/org/ray/api/test/RayConfigTest.java index fd47e15ab494b..71e3d0dfff8e7 100644 --- a/java/test/src/main/java/org/ray/api/test/RayConfigTest.java +++ b/java/test/src/main/java/org/ray/api/test/RayConfigTest.java @@ -11,6 +11,7 @@ public class RayConfigTest { @Test public void testCreateRayConfig() { System.setProperty("ray.home", "/path/to/ray"); + System.setProperty("ray.driver.resource-path", "path/to/ray/driver/resource/path"); RayConfig rayConfig = RayConfig.create(); Assert.assertEquals("/path/to/ray", rayConfig.rayHome); @@ -19,8 +20,12 @@ public void testCreateRayConfig() { System.setProperty("ray.home", ""); rayConfig = RayConfig.create(); + Assert.assertEquals(System.getProperty("user.dir"), rayConfig.rayHome); Assert.assertEquals(System.getProperty("user.dir") + - "/build/src/common/thirdparty/redis/src/redis-server", rayConfig.redisServerExecutablePath); + "/build/src/ray/thirdparty/redis/src/redis-server", rayConfig.redisServerExecutablePath); + + Assert.assertEquals("path/to/ray/driver/resource/path", rayConfig.driverResourcePath); + } } diff --git a/java/test/src/main/java/org/ray/api/test/ResourcesManagementTest.java b/java/test/src/main/java/org/ray/api/test/ResourcesManagementTest.java index 001723fec4bf6..e185a5f19a894 100644 --- a/java/test/src/main/java/org/ray/api/test/ResourcesManagementTest.java +++ b/java/test/src/main/java/org/ray/api/test/ResourcesManagementTest.java @@ -1,6 +1,8 @@ package org.ray.api.test; import com.google.common.collect.ImmutableList; +import com.google.common.collect.ImmutableMap; +import jdk.nashorn.internal.ir.annotations.Immutable; import org.junit.Assert; import org.junit.Test; import org.junit.runner.RunWith; @@ -9,7 +11,8 @@ import org.ray.api.RayObject; import org.ray.api.WaitResult; import org.ray.api.annotation.RayRemote; -import org.ray.api.annotation.ResourceItem; +import org.ray.api.options.ActorCreationOptions; +import org.ray.api.options.CallOptions; /** * Resources Management Test. 
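For reference, a minimal sketch of how the options-based API introduced in this patch is meant to be used; the test hunks below exercise exactly this pattern. `OptionsUsageSketch` and its members are illustrative names, not part of the diff:

// Illustrative only -- not part of this patch.
import com.google.common.collect.ImmutableMap;
import org.ray.api.Ray;
import org.ray.api.RayActor;
import org.ray.api.RayObject;
import org.ray.api.annotation.RayRemote;
import org.ray.api.options.ActorCreationOptions;
import org.ray.api.options.CallOptions;

public class OptionsUsageSketch {

  @RayRemote
  public static Integer echo(Integer x) {
    return x;
  }

  @RayRemote
  public static class Counter {
    public Integer ping() {
      return 1;
    }
  }

  public static void main(String[] args) {
    Ray.init();

    // Resource demands are now passed per call instead of via @RayRemote(resources = ...).
    CallOptions callOptions = new CallOptions(ImmutableMap.of("CPU", 1.0));
    RayObject<Integer> result = Ray.call(OptionsUsageSketch::echo, 42, callOptions);

    // Actors declare their resource demand once, at creation time.
    ActorCreationOptions creationOptions =
        new ActorCreationOptions(ImmutableMap.of("CPU", 1.0));
    RayActor<Counter> counter = Ray.createActor(Counter::new, creationOptions);
    RayObject<Integer> pong = Ray.call(Counter::ping, counter);

    System.out.println(result.get() + " " + pong.get());
  }
}

Note that, per this diff, only `Ray.call` for plain tasks and `Ray.createActor` gain the extra options overloads; calls on an existing actor take no options argument.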
@@ -17,29 +20,13 @@ @RunWith(MyRunner.class) public class ResourcesManagementTest { - @RayRemote(resources = {@ResourceItem(name = "CPU", value = 4), - @ResourceItem(name = "GPU", value = 0)}) - public static Integer echo1(Integer number) { + @RayRemote + public static Integer echo(Integer number) { return number; } - @RayRemote(resources = {@ResourceItem(name = "CPU", value = 4), - @ResourceItem(name = "GPU", value = 2)}) - public static Integer echo2(Integer number) { - return number; - } - - @RayRemote(resources = {@ResourceItem(name = "CPU", value = 2), - @ResourceItem(name = "GPU", value = 0)}) - public static class Echo1 { - public Integer echo(Integer number) { - return number; - } - } - - @RayRemote(resources = {@ResourceItem(name = "CPU", value = 8), - @ResourceItem(name = "GPU", value = 0)}) - public static class Echo2 { + @RayRemote + public static class Echo { public Integer echo(Integer number) { return number; } @@ -47,12 +34,18 @@ public Integer echo(Integer number) { @Test public void testMethods() { + CallOptions callOptions1 = new CallOptions(ImmutableMap.of("CPU", 4.0, "GPU", 0.0)); + // This is a case that can satisfy required resources. - RayObject result1 = Ray.call(ResourcesManagementTest::echo1, 100); + // The static resources for test are "CPU:4,RES-A:4". + RayObject result1 = Ray.call(ResourcesManagementTest::echo, 100, callOptions1); Assert.assertEquals(100, (int) result1.get()); + CallOptions callOptions2 = new CallOptions(ImmutableMap.of("CPU", 4.0, "GPU", 2.0)); + // This is a case that can't satisfy required resources. - final RayObject result2 = Ray.call(ResourcesManagementTest::echo2, 200); + // The static resources for test are "CPU:4,RES-A:4". + final RayObject result2 = Ray.call(ResourcesManagementTest::echo, 200, callOptions2); WaitResult waitResult = Ray.wait(ImmutableList.of(result2), 1, 1000); Assert.assertEquals(0, waitResult.getReady().size()); @@ -61,14 +54,24 @@ public void testMethods() { @Test public void testActors() { + + ActorCreationOptions actorCreationOptions1 = + new ActorCreationOptions(ImmutableMap.of("CPU", 2.0, "GPU", 0.0)); + // This is a case that can satisfy required resources. - RayActor echo1 = Ray.createActor(Echo1::new); - final RayObject result1 = Ray.call(Echo1::echo, echo1, 100); + // The static resources for test are "CPU:4,RES-A:4". + RayActor echo1 = Ray.createActor(Echo::new, actorCreationOptions1); + final RayObject result1 = Ray.call(Echo::echo, echo1, 100); Assert.assertEquals(100, (int) result1.get()); // This is a case that can't satisfy required resources. - RayActor echo2 = Ray.createActor(Echo2::new); - final RayObject result2 = Ray.call(Echo2::echo, echo2, 100); + // The static resources for test are "CPU:4,RES-A:4". 
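+    // Requesting "CPU": 8.0 exceeds the configured "CPU:4", so this actor can never be
+    // scheduled and the wait below finds no ready result.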
+ ActorCreationOptions actorCreationOptions2 = + new ActorCreationOptions(ImmutableMap.of("CPU", 8.0, "GPU", 0.0)); + + RayActor echo2 = + Ray.createActor(Echo::new, actorCreationOptions2); + final RayObject result2 = Ray.call(Echo::echo, echo2, 100); WaitResult waitResult = Ray.wait(ImmutableList.of(result2), 1, 1000); Assert.assertEquals(0, waitResult.getReady().size()); diff --git a/java/test/src/main/java/org/ray/api/test/StressTest.java b/java/test/src/main/java/org/ray/api/test/StressTest.java new file mode 100644 index 0000000000000..4fab74aed1991 --- /dev/null +++ b/java/test/src/main/java/org/ray/api/test/StressTest.java @@ -0,0 +1,98 @@ +package org.ray.api.test; + +import com.google.common.collect.ImmutableList; +import java.util.ArrayList; +import java.util.List; +import org.junit.Assert; +import org.junit.Test; +import org.junit.runner.RunWith; +import org.ray.api.Ray; +import org.ray.api.RayActor; +import org.ray.api.RayObject; +import org.ray.api.id.UniqueId; + +@RunWith(MyRunner.class) +public class StressTest { + + public static int echo(int x) { + return x; + } + + @Test + public void testSubmittingTasks() { + for (int numIterations : ImmutableList.of(1, 10, 100, 1000)) { + int numTasks = 1000 / numIterations; + for (int i = 0; i < numIterations; i++) { + List resultIds = new ArrayList<>(); + for (int j = 0; j < numTasks; j++) { + resultIds.add(Ray.call(StressTest::echo, 1).getId()); + } + for (Integer result : Ray.get(resultIds)) { + Assert.assertEquals(result, Integer.valueOf(1)); + } + } + } + } + + @Test + public void testDependency() { + RayObject x = Ray.call(StressTest::echo, 1); + for (int i = 0; i < 1000; i++) { + x = Ray.call(StressTest::echo, x); + } + Assert.assertEquals(x.get(), Integer.valueOf(1)); + } + + public static class Actor { + + public int ping() { + return 1; + } + } + + public static class Worker { + + private RayActor actor; + + public Worker(RayActor actor) { + this.actor = actor; + } + + public int ping(int n) { + List objectIds = new ArrayList<>(); + for (int i = 0; i < n; i++) { + objectIds.add(Ray.call(Actor::ping, actor).getId()); + } + int sum = 0; + for (Integer result : Ray.get(objectIds)) { + sum += result; + } + return sum; + } + } + + @Test + public void testSubmittingManyTasksToOneActor() { + RayActor actor = Ray.createActor(Actor::new); + List objectIds = new ArrayList<>(); + for (int i = 0; i < 10; i++) { + RayActor worker = Ray.createActor(Worker::new, actor); + objectIds.add(Ray.call(Worker::ping, worker, 100).getId()); + } + for (Integer result : Ray.get(objectIds)) { + Assert.assertEquals(result, Integer.valueOf(100)); + } + } + + @Test + public void testPuttingAndGettingManyObjects() { + Integer objectToPut = 1; + List> objects = new ArrayList<>(); + for (int i = 0; i < 100_000; i++) { + objects.add(Ray.put(objectToPut)); + } + for (RayObject object : objects) { + Assert.assertEquals(object.get(), objectToPut); + } + } +} diff --git a/java/test/src/main/java/org/ray/api/test/TestListener.java b/java/test/src/main/java/org/ray/api/test/TestListener.java index 3fb16bf4f379f..efc419b34720e 100644 --- a/java/test/src/main/java/org/ray/api/test/TestListener.java +++ b/java/test/src/main/java/org/ray/api/test/TestListener.java @@ -10,7 +10,7 @@ public class TestListener extends RunListener { @Override public void testRunStarted(Description description) { System.setProperty("ray.home", "../.."); - System.setProperty("ray.resources", "CPU:4"); + System.setProperty("ray.resources", "CPU:4,RES-A:4"); Ray.init(); } diff --git 
a/java/test/src/main/java/org/ray/api/test/UniqueIdTest.java b/java/test/src/main/java/org/ray/api/test/UniqueIdTest.java index 0a21fc2872bf3..2fd47057d90de 100644 --- a/java/test/src/main/java/org/ray/api/test/UniqueIdTest.java +++ b/java/test/src/main/java/org/ray/api/test/UniqueIdTest.java @@ -5,18 +5,16 @@ import javax.xml.bind.DatatypeConverter; import org.junit.Assert; import org.junit.Test; -import org.junit.runner.RunWith; import org.ray.api.id.UniqueId; -import org.ray.runtime.util.UniqueIdHelper; +import org.ray.runtime.util.UniqueIdUtil; -@RunWith(MyRunner.class) public class UniqueIdTest { @Test public void testConstructUniqueId() { // Test `fromHexString()` UniqueId id1 = UniqueId.fromHexString("00000000123456789ABCDEF123456789ABCDEF00"); - Assert.assertEquals("00000000123456789ABCDEF123456789ABCDEF00", id1.toString()); + Assert.assertEquals("00000000123456789abcdef123456789abcdef00", id1.toString()); Assert.assertFalse(id1.isNil()); try { @@ -40,12 +38,12 @@ public void testConstructUniqueId() { ByteBuffer byteBuffer = ByteBuffer.wrap(bytes, 0, 20); UniqueId id4 = UniqueId.fromByteBuffer(byteBuffer); Assert.assertTrue(Arrays.equals(bytes, id4.getBytes())); - Assert.assertEquals("0123456789ABCDEF0123456789ABCDEF01234567", id4.toString()); + Assert.assertEquals("0123456789abcdef0123456789abcdef01234567", id4.toString()); // Test `genNil()` UniqueId id6 = UniqueId.genNil(); - Assert.assertEquals("FFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFF", id6.toString()); + Assert.assertEquals("FFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFFF".toLowerCase(), id6.toString()); Assert.assertTrue(id6.isNil()); } @@ -54,19 +52,19 @@ public void testComputeReturnId() { // Mock a taskId, and the lowest 4 bytes should be 0. UniqueId taskId = UniqueId.fromHexString("00000000123456789ABCDEF123456789ABCDEF00"); - UniqueId returnId = UniqueIdHelper.computeReturnId(taskId, 1); - Assert.assertEquals("01000000123456789ABCDEF123456789ABCDEF00", returnId.toString()); + UniqueId returnId = UniqueIdUtil.computeReturnId(taskId, 1); + Assert.assertEquals("01000000123456789abcdef123456789abcdef00", returnId.toString()); - returnId = UniqueIdHelper.computeReturnId(taskId, 0x01020304); - Assert.assertEquals("04030201123456789ABCDEF123456789ABCDEF00", returnId.toString()); + returnId = UniqueIdUtil.computeReturnId(taskId, 0x01020304); + Assert.assertEquals("04030201123456789abcdef123456789abcdef00", returnId.toString()); } @Test public void testComputeTaskId() { UniqueId objId = UniqueId.fromHexString("34421980123456789ABCDEF123456789ABCDEF00"); - UniqueId taskId = UniqueIdHelper.computeTaskId(objId); + UniqueId taskId = UniqueIdUtil.computeTaskId(objId); - Assert.assertEquals("00000000123456789ABCDEF123456789ABCDEF00", taskId.toString()); + Assert.assertEquals("00000000123456789abcdef123456789abcdef00", taskId.toString()); } @Test @@ -74,11 +72,11 @@ public void testComputePutId() { // Mock a taskId, the lowest 4 bytes should be 0. 
UniqueId taskId = UniqueId.fromHexString("00000000123456789ABCDEF123456789ABCDEF00"); - UniqueId putId = UniqueIdHelper.computePutId(taskId, 1); - Assert.assertEquals("FFFFFFFF123456789ABCDEF123456789ABCDEF00", putId.toString()); + UniqueId putId = UniqueIdUtil.computePutId(taskId, 1); + Assert.assertEquals("FFFFFFFF123456789ABCDEF123456789ABCDEF00".toLowerCase(), putId.toString()); - putId = UniqueIdHelper.computePutId(taskId, 0x01020304); - Assert.assertEquals("FCFCFDFE123456789ABCDEF123456789ABCDEF00", putId.toString()); + putId = UniqueIdUtil.computePutId(taskId, 0x01020304); + Assert.assertEquals("FCFCFDFE123456789ABCDEF123456789ABCDEF00".toLowerCase(), putId.toString()); } } diff --git a/java/tutorial/pom.xml b/java/tutorial/pom.xml index 198f6f0a3a51e..48a03dc1ca8e1 100644 --- a/java/tutorial/pom.xml +++ b/java/tutorial/pom.xml @@ -40,7 +40,7 @@ ${basedir}/../ray.config.ini -ea - -Djava.library.path=${basedir}/../../build/src/plasma:${basedir}/../../build/src/local_scheduler + -Djava.library.path=${basedir}/../../build/src/plasma:${basedir}/../../build/src/ray/raylet -noverify -DlogOutput=console diff --git a/python/benchmarks/benchmark_actor.py b/python/benchmarks/benchmark_actor.py index b0450c14de6a6..2eb476e1f172f 100644 --- a/python/benchmarks/benchmark_actor.py +++ b/python/benchmarks/benchmark_actor.py @@ -9,7 +9,7 @@ def setup(): if not hasattr(setup, "is_initialized"): - ray.init(num_workers=NUM_WORKERS, num_cpus=4) + ray.init(num_cpus=4) setup.is_initialized = True diff --git a/python/benchmarks/benchmark_get.py b/python/benchmarks/benchmark_get.py index 27a848e9cf3c6..fccfc00e0f709 100644 --- a/python/benchmarks/benchmark_get.py +++ b/python/benchmarks/benchmark_get.py @@ -9,7 +9,7 @@ def setup(): if not hasattr(setup, "is_initialized"): - ray.init(num_workers=4, num_cpus=4) + ray.init(num_cpus=4) setup.is_initialized = True diff --git a/python/benchmarks/benchmark_put.py b/python/benchmarks/benchmark_put.py index 986a28c89f283..e74bf099666ac 100644 --- a/python/benchmarks/benchmark_put.py +++ b/python/benchmarks/benchmark_put.py @@ -9,7 +9,7 @@ def setup(): if not hasattr(setup, "is_initialized"): - ray.init(num_workers=4, num_cpus=4) + ray.init(num_cpus=0) setup.is_initialized = True diff --git a/python/benchmarks/benchmark_queue.py b/python/benchmarks/benchmark_queue.py index bc4ec6a41ee5d..fd8a4a6eb13a8 100644 --- a/python/benchmarks/benchmark_queue.py +++ b/python/benchmarks/benchmark_queue.py @@ -8,7 +8,7 @@ def setup(): if not hasattr(setup, "is_initialized"): - ray.init(num_workers=4, num_cpus=4) + ray.init(num_cpus=4) setup.is_initialized = True diff --git a/python/benchmarks/benchmark_task.py b/python/benchmarks/benchmark_task.py index 30a4bb8cb1f23..b454f63277fc5 100644 --- a/python/benchmarks/benchmark_task.py +++ b/python/benchmarks/benchmark_task.py @@ -7,7 +7,7 @@ def setup(): if not hasattr(setup, "is_initialized"): - ray.init(num_workers=10, num_cpus=10, resources={"foo": 1}) + ray.init(num_cpus=10, resources={"foo": 1}) setup.is_initialized = True diff --git a/python/benchmarks/benchmark_wait.py b/python/benchmarks/benchmark_wait.py index b40c0463a6cbe..614d76a38c54f 100644 --- a/python/benchmarks/benchmark_wait.py +++ b/python/benchmarks/benchmark_wait.py @@ -9,7 +9,7 @@ def setup(*args): if not hasattr(setup, "is_initialized"): - ray.init(num_workers=4, num_cpus=4) + ray.init(num_cpus=4) setup.is_initialized = True diff --git a/python/benchmarks/benchmarks.py b/python/benchmarks/benchmarks.py index 6eac996a48a55..c286e1ef6ec0f 100644 --- 
a/python/benchmarks/benchmarks.py +++ b/python/benchmarks/benchmarks.py @@ -7,7 +7,7 @@ def setup(): if not hasattr(setup, "is_initialized"): - ray.init(num_workers=4, num_cpus=4) + ray.init(num_cpus=4) setup.is_initialized = True diff --git a/python/build-wheel-macos.sh b/python/build-wheel-macos.sh index 588362e8099e2..30e8b19363769 100755 --- a/python/build-wheel-macos.sh +++ b/python/build-wheel-macos.sh @@ -16,15 +16,24 @@ DOWNLOAD_DIR=python_downloads PY_VERSIONS=("2.7.13" "3.4.4" "3.5.3" - "3.6.1") + "3.6.1" + "3.7.0") PY_INSTS=("python-2.7.13-macosx10.6.pkg" "python-3.4.4-macosx10.6.pkg" "python-3.5.3-macosx10.6.pkg" - "python-3.6.1-macosx10.6.pkg") + "python-3.6.1-macosx10.6.pkg" + "python-3.7.0-macosx10.6.pkg") PY_MMS=("2.7" "3.4" "3.5" - "3.6") + "3.6" + "3.7") +# On python 3.7, a newer version of numpy seems to be necessary. +NUMPY_VERSIONS=("1.10.4" + "1.10.4" + "1.10.4" + "1.10.4" + "1.14.5") mkdir -p $DOWNLOAD_DIR mkdir -p .whl @@ -33,6 +42,7 @@ for ((i=0; i<${#PY_VERSIONS[@]}; ++i)); do PY_VERSION=${PY_VERSIONS[i]} PY_INST=${PY_INSTS[i]} PY_MM=${PY_MMS[i]} + NUMPY_VERSION=${NUMPY_VERSIONS[i]} # The -f flag is passed twice to also run git clean in the arrow subdirectory. # The -d flag removes directories. The -x flag ignores the .gitignore file, @@ -60,7 +70,7 @@ for ((i=0; i<${#PY_VERSIONS[@]}; ++i)); do $PIP_CMD install -q setuptools_scm==2.1.0 # Fix the numpy version because this will be the oldest numpy version we can # support. - $PIP_CMD install -q numpy==1.10.4 cython==0.27.3 + $PIP_CMD install -q numpy==$NUMPY_VERSION cython==0.27.3 # Install wheel to avoid the error "invalid command 'bdist_wheel'". $PIP_CMD install -q wheel # Add the correct Python to the path and build the wheel. This is only diff --git a/python/build-wheel-manylinux1.sh b/python/build-wheel-manylinux1.sh index 8fdee4a1a480e..db31ff55a4e6e 100755 --- a/python/build-wheel-manylinux1.sh +++ b/python/build-wheel-manylinux1.sh @@ -13,7 +13,7 @@ rm -f /usr/bin/python2 ln -s /opt/python/cp27-cp27m/bin/python2 /usr/bin/python2 mkdir .whl -for PYTHON in cp27-cp27mu cp34-cp34m cp35-cp35m cp36-cp36m; do +for PYTHON in cp27-cp27mu cp34-cp34m cp35-cp35m cp36-cp36m cp37-cp37m; do # The -f flag is passed twice to also run git clean in the arrow subdirectory. # The -d flag removes directories. The -x flag ignores the .gitignore file, # and the -e flag ensures that we don't remove the .whl directory. diff --git a/python/ray/WebUI.ipynb b/python/ray/WebUI.ipynb index 390263827e037..229366eba10b6 100644 --- a/python/ray/WebUI.ipynb +++ b/python/ray/WebUI.ipynb @@ -1,150 +1,97 @@ { - "cells": [ - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Ray UI\n", - "\n", - "Start the UI with **Kernel -> Restart and Run All**." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "import os\n", - "import ray\n", - "import ray.experimental.ui as ui\n", - "\n", - "ray.init(redis_address=os.environ[\"REDIS_ADDRESS\"])" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Object search." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "ui.object_search_bar()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Task search." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "ui.task_search_bar()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Task trace timeline." - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "To view arrows, go to View Options and select Flow Events." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "ui.task_timeline()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Task durations." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "ui.task_completion_time_distribution()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### CPU usage." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "ui.cpu_usage()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### Cluster usage." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "ui.cluster_usage()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.1" - } - }, - "nbformat": 4, - "nbformat_minor": 2 + "cells": [{ + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Ray UI\n", "\n", + "Start the UI with **Kernel -> Restart and Run All**." + ] + }, { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", "import ray\n", + "import ray.experimental.ui as ui\n", "\n", + "ray.init(redis_address=os.environ[\"REDIS_ADDRESS\"])" + ] + }, { + "cell_type": "markdown", + "metadata": {}, + "source": ["#### Task trace timeline."] + }, { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To view arrows, go to View Options and select Flow Events." 
+ ] + }, { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": ["ui.task_timeline()"] + }, { + "cell_type": "markdown", + "metadata": {}, + "source": ["#### Object transfer timeline."] + }, { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": ["ui.object_transfer_timeline()"] + }, { + "cell_type": "markdown", + "metadata": {}, + "source": ["#### Task durations."] + }, { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": ["ui.task_completion_time_distribution()"] + }, { + "cell_type": "markdown", + "metadata": {}, + "source": ["#### CPU usage."] + }, { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": ["ui.cpu_usage()"] + }, { + "cell_type": "markdown", + "metadata": {}, + "source": ["#### Cluster usage."] + }, { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": ["ui.cluster_usage()"] + }], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.6.1" + } + }, + "nbformat": 4, + "nbformat_minor": 2 } diff --git a/python/ray/__init__.py b/python/ray/__init__.py index b97af4b587daa..ed024a107aa50 100644 --- a/python/ray/__init__.py +++ b/python/ray/__init__.py @@ -46,7 +46,10 @@ e.args += (helpful_message, ) raise -from ray.local_scheduler import ObjectID, _config # noqa: E402 +modin_path = os.path.join(os.path.abspath(os.path.dirname(__file__)), "modin") +sys.path.insert(0, modin_path) + +from ray.raylet import ObjectID, _config # noqa: E402 from ray.profiling import profile # noqa: E402 from ray.worker import (error_info, init, connect, disconnect, get, put, wait, remote, get_gpu_ids, get_resource_ids, get_webui_url, @@ -61,9 +64,8 @@ import ray.actor # noqa: F401 from ray.actor import method # noqa: E402 -# Ray version string. TODO(rkn): This is also defined separately in setup.py. -# Fix this. -__version__ = "0.5.3" +# Ray version string. 
+__version__ = "0.6.0" __all__ = [ "error_info", "init", "connect", "disconnect", "get", "put", "wait", diff --git a/python/ray/actor.py b/python/ray/actor.py index 3886e1927a02f..926f15b293644 100644 --- a/python/ray/actor.py +++ b/python/ray/actor.py @@ -5,29 +5,21 @@ import copy import hashlib import inspect -import json +import logging +import sys import traceback import ray.cloudpickle as pickle -import ray.local_scheduler +from ray.function_manager import FunctionActorManager +import ray.raylet import ray.ray_constants as ray_constants import ray.signature as signature import ray.worker -from ray.utils import ( - decode, - _random_string, - check_oversized_pickle, - is_cython, - push_error_to_driver, -) +from ray.utils import _random_string DEFAULT_ACTOR_METHOD_NUM_RETURN_VALS = 1 - -def is_classmethod(f): - """Returns whether the given method is a classmethod.""" - - return hasattr(f, "__self__") and f.__self__ is not None +logger = logging.getLogger(__name__) def compute_actor_handle_id(actor_handle_id, num_forks): @@ -96,24 +88,6 @@ def compute_actor_creation_function_id(class_id): return ray.ObjectID(class_id) -def compute_actor_method_function_id(class_name, attr): - """Get the function ID corresponding to an actor method. - - Args: - class_name (str): The class name of the actor. - attr (str): The attribute name of the method. - - Returns: - Function ID corresponding to the method. - """ - function_id_hash = hashlib.sha1() - function_id_hash.update(class_name.encode("ascii")) - function_id_hash.update(attr.encode("ascii")) - function_id = function_id_hash.digest() - assert len(function_id) == ray_constants.ID_SIZE - return ray.ObjectID(function_id) - - def set_actor_checkpoint(worker, actor_id, checkpoint_index, checkpoint, frontier): """Set the most recent checkpoint associated with a given actor ID. @@ -134,28 +108,6 @@ def set_actor_checkpoint(worker, actor_id, checkpoint_index, checkpoint, }) -def get_actor_checkpoint(worker, actor_id): - """Get the most recent checkpoint associated with a given actor ID. - - Args: - worker: The worker to use to get the checkpoint. - actor_id: The actor ID of the actor to get the checkpoint for. - - Returns: - If a checkpoint exists, this returns a tuple of the number of tasks - included in the checkpoint, the saved checkpoint state, and the - task frontier at the time of the checkpoint. If no checkpoint - exists, all objects are set to None. The checkpoint index is the . - executed on the actor before the checkpoint was made. - """ - actor_key = b"Actor:" + actor_id - checkpoint_index, checkpoint, frontier = worker.redis_client.hmget( - actor_key, ["checkpoint_index", "checkpoint", "frontier"]) - if checkpoint_index is not None: - checkpoint_index = int(checkpoint_index) - return checkpoint_index, checkpoint, frontier - - def save_and_log_checkpoint(worker, actor): """Save a checkpoint on the actor and log any errors. @@ -205,219 +157,26 @@ def restore_and_log_checkpoint(worker, actor): return checkpoint_resumed -def make_actor_method_executor(worker, method_name, method, actor_imported): - """Make an executor that wraps a user-defined actor method. - - The wrapped method updates the worker's internal state and performs any - necessary checkpointing operations. +def get_actor_checkpoint(worker, actor_id): + """Get the most recent checkpoint associated with a given actor ID. Args: - worker (Worker): The worker that is executing the actor. - method_name (str): The name of the actor method. - method (instancemethod): The actor method to wrap. 
This should be a - method defined on the actor class and should therefore take an - instance of the actor as the first argument. - actor_imported (bool): Whether the actor has been imported. - Checkpointing operations will not be run if this is set to False. + worker: The worker to use to get the checkpoint. + actor_id: The actor ID of the actor to get the checkpoint for. Returns: - A function that executes the given actor method on the worker's stored - instance of the actor. The function also updates the worker's - internal state to record the executed method. - """ - - def actor_method_executor(dummy_return_id, actor, *args): - # Update the actor's task counter to reflect the task we're about to - # execute. - worker.actor_task_counter += 1 - - # If this is the first task to execute on the actor, try to resume from - # a checkpoint. - if actor_imported and worker.actor_task_counter == 1: - checkpoint_resumed = restore_and_log_checkpoint(worker, actor) - if checkpoint_resumed: - # NOTE(swang): Since we did not actually execute the __init__ - # method, this will put None as the return value. If the - # __init__ method is supposed to return multiple values, an - # exception will be logged. - return - - # Determine whether we should checkpoint the actor. - checkpointing_on = (actor_imported - and worker.actor_checkpoint_interval > 0) - # We should checkpoint the actor if user checkpointing is on, we've - # executed checkpoint_interval tasks since the last checkpoint, and the - # method we're about to execute is not a checkpoint. - save_checkpoint = ( - checkpointing_on and - (worker.actor_task_counter % worker.actor_checkpoint_interval == 0 - and method_name != "__ray_checkpoint__")) - - # Execute the assigned method and save a checkpoint if necessary. - try: - if is_classmethod(method): - method_returns = method(*args) - else: - method_returns = method(actor, *args) - except Exception: - # Save the checkpoint before allowing the method exception to be - # thrown. - if save_checkpoint: - save_and_log_checkpoint(worker, actor) - raise - else: - # Save the checkpoint before returning the method's return values. - if save_checkpoint: - save_and_log_checkpoint(worker, actor) - return method_returns - - return actor_method_executor - - -def fetch_and_register_actor(actor_class_key, worker): - """Import an actor. - - This will be called by the worker's import thread when the worker receives - the actor_class export, assuming that the worker is an actor for that - class. - - Args: - actor_class_key: The key in Redis to use to fetch the actor. - worker: The worker to use. - """ - actor_id_str = worker.actor_id - (driver_id, class_id, class_name, module, pickled_class, - checkpoint_interval, actor_method_names) = worker.redis_client.hmget( - actor_class_key, [ - "driver_id", "class_id", "class_name", "module", "class", - "checkpoint_interval", "actor_method_names" - ]) - - class_name = decode(class_name) - module = decode(module) - checkpoint_interval = int(checkpoint_interval) - actor_method_names = json.loads(decode(actor_method_names)) - - # Create a temporary actor with some temporary methods so that if the actor - # fails to be unpickled, the temporary actor can be used (just to produce - # error messages and to prevent the driver from hanging). 
- class TemporaryActor(object): - pass - - worker.actors[actor_id_str] = TemporaryActor() - worker.actor_checkpoint_interval = checkpoint_interval - - def temporary_actor_method(*xs): - raise Exception("The actor with name {} failed to be imported, and so " - "cannot execute this method".format(class_name)) - - # Register the actor method executors. - for actor_method_name in actor_method_names: - function_id = compute_actor_method_function_id(class_name, - actor_method_name).id() - temporary_executor = make_actor_method_executor( - worker, - actor_method_name, - temporary_actor_method, - actor_imported=False) - worker.function_execution_info[driver_id][function_id] = ( - ray.worker.FunctionExecutionInfo( - function=temporary_executor, - function_name=actor_method_name, - max_calls=0)) - worker.num_task_executions[driver_id][function_id] = 0 - - try: - unpickled_class = pickle.loads(pickled_class) - worker.actor_class = unpickled_class - except Exception: - # If an exception was thrown when the actor was imported, we record the - # traceback and notify the scheduler of the failure. - traceback_str = ray.utils.format_error_message(traceback.format_exc()) - # Log the error message. - push_error_to_driver( - worker, - ray_constants.REGISTER_ACTOR_PUSH_ERROR, - traceback_str, - driver_id, - data={"actor_id": actor_id_str}) - # TODO(rkn): In the future, it might make sense to have the worker exit - # here. However, currently that would lead to hanging if someone calls - # ray.get on a method invoked on the actor. - else: - # TODO(pcm): Why is the below line necessary? - unpickled_class.__module__ = module - worker.actors[actor_id_str] = unpickled_class.__new__(unpickled_class) - - def pred(x): - return (inspect.isfunction(x) or inspect.ismethod(x) - or is_cython(x)) - - actor_methods = inspect.getmembers(unpickled_class, predicate=pred) - for actor_method_name, actor_method in actor_methods: - function_id = compute_actor_method_function_id( - class_name, actor_method_name).id() - executor = make_actor_method_executor( - worker, actor_method_name, actor_method, actor_imported=True) - worker.function_execution_info[driver_id][function_id] = ( - ray.worker.FunctionExecutionInfo( - function=executor, - function_name=actor_method_name, - max_calls=0)) - # We do not set worker.function_properties[driver_id][function_id] - # because we currently do need the actor worker to submit new tasks - # for the actor. - - -def publish_actor_class_to_key(key, actor_class_info, worker): - """Push an actor class definition to Redis. - - The is factored out as a separate function because it is also called - on cached actor class definitions when a worker connects for the first - time. - - Args: - key: The key to store the actor class info at. - actor_class_info: Information about the actor class. - worker: The worker to use to connect to Redis. + If a checkpoint exists, this returns a tuple of the number of tasks + included in the checkpoint, the saved checkpoint state, and the + task frontier at the time of the checkpoint. If no checkpoint + exists, all objects are set to None. The checkpoint index is the . + executed on the actor before the checkpoint was made. """ - # We set the driver ID here because it may not have been available when the - # actor class was defined. 
- actor_class_info["driver_id"] = worker.task_driver_id.id() - worker.redis_client.hmset(key, actor_class_info) - worker.redis_client.rpush("Exports", key) - - -def export_actor_class(class_id, Class, actor_method_names, - checkpoint_interval, worker): - key = b"ActorClass:" + class_id - actor_class_info = { - "class_name": Class.__name__, - "module": Class.__module__, - "class": pickle.dumps(Class), - "checkpoint_interval": checkpoint_interval, - "actor_method_names": json.dumps(list(actor_method_names)) - } - - check_oversized_pickle(actor_class_info["class"], - actor_class_info["class_name"], "actor", worker) - - if worker.mode is None: - # This means that 'ray.init()' has not been called yet and so we must - # cache the actor class definition and export it when 'ray.init()' is - # called. - assert worker.cached_remote_functions_and_actors is not None - worker.cached_remote_functions_and_actors.append( - ("actor", (key, actor_class_info))) - # This caching code path is currently not used because we only export - # actor class definitions lazily when we instantiate the actor for the - # first time. - assert False, "This should be unreachable." - else: - publish_actor_class_to_key(key, actor_class_info, worker) - # TODO(rkn): Currently we allow actor classes to be defined within tasks. - # I tried to disable this, but it may be necessary because of - # https://github.com/ray-project/ray/issues/1146. + actor_key = b"Actor:" + actor_id + checkpoint_index, checkpoint, frontier = worker.redis_client.hmget( + actor_key, ["checkpoint_index", "checkpoint", "frontier"]) + if checkpoint_index is not None: + checkpoint_index = int(checkpoint_index) + return checkpoint_index, checkpoint, frontier def method(*args, **kwargs): @@ -466,9 +225,15 @@ def __call__(self, *args, **kwargs): self._method_name)) def remote(self, *args, **kwargs): - return self._submit(args, kwargs) + return self._remote(args, kwargs) def _submit(self, args, kwargs, num_return_vals=None): + logger.warn( + "WARNING: _submit() is being deprecated. Please use _remote().") + return self._remote( + args=args, kwargs=kwargs, num_return_vals=num_return_vals) + + def _remote(self, args, kwargs, num_return_vals=None): if num_return_vals is None: num_return_vals = self._num_return_vals @@ -518,13 +283,8 @@ def __init__(self, modified_class, class_id, checkpoint_interval, num_cpus, self._actor_method_cpus = actor_method_cpus self._exported = False - # Get the actor methods of the given class. - def pred(x): - return (inspect.isfunction(x) or inspect.ismethod(x) - or is_cython(x)) - self._actor_methods = inspect.getmembers( - self._modified_class, predicate=pred) + self._modified_class, ray.utils.is_function_or_method) # Extract the signatures of each of the methods. This will be used # to catch some errors if the methods are called with inappropriate # arguments. @@ -537,7 +297,7 @@ def pred(x): # don't support, there may not be much the user can do about it. signature.check_signature_supported(method, warn=True) self._method_signatures[method_name] = signature.extract_signature( - method, ignore_first=not is_classmethod(method)) + method, ignore_first=not ray.utils.is_class_method(method)) # Set the default number of return values for this method. if hasattr(method, "__ray_num_return_vals__"): @@ -568,7 +328,7 @@ def remote(self, *args, **kwargs): Returns: A handle to the newly created actor. 
""" - return self._submit(args=args, kwargs=kwargs) + return self._remote(args=args, kwargs=kwargs) def _submit(self, args, @@ -576,6 +336,21 @@ def _submit(self, num_cpus=None, num_gpus=None, resources=None): + logger.warn( + "WARNING: _submit() is being deprecated. Please use _remote().") + return self._remote( + args=args, + kwargs=kwargs, + num_cpus=num_cpus, + num_gpus=num_gpus, + resources=resources) + + def _remote(self, + args, + kwargs, + num_cpus=None, + num_gpus=None, + resources=None): """Create an actor. This method allows more flexibility than the remote method because @@ -614,15 +389,24 @@ def _submit(self, else: # Export the actor. if not self._exported: - export_actor_class(self._class_id, self._modified_class, - self._actor_method_names, - self._checkpoint_interval, worker) + worker.function_actor_manager.export_actor_class( + self._class_id, self._modified_class, + self._actor_method_names, self._checkpoint_interval) self._exported = True resources = ray.utils.resources_from_resource_arguments( self._num_cpus, self._num_gpus, self._resources, num_cpus, num_gpus, resources) + # If the actor methods require CPU resources, then set the required + # placement resources. If actor_placement_resources is empty, then + # the required placement resources will be the same as resources. + actor_placement_resources = {} + assert self._actor_method_cpus in [0, 1] + if self._actor_method_cpus == 1: + actor_placement_resources = resources.copy() + actor_placement_resources["CPU"] += 1 + creation_args = [self._class_id] function_id = compute_actor_creation_function_id(self._class_id) [actor_cursor] = worker.submit_task( @@ -630,7 +414,8 @@ def _submit(self, creation_args, actor_creation_id=actor_id, num_return_vals=1, - resources=resources) + resources=resources, + placement_resources=actor_placement_resources) # We initialize the actor counter at 1 to account for the actor # creation task. @@ -741,6 +526,7 @@ def __init__(self, self._ray_actor_method_cpus = actor_method_cpus self._ray_actor_driver_id = actor_driver_id self._ray_previous_actor_handle_id = previous_actor_handle_id + self._ray_previously_generated_actor_handle_id = None def _actor_method_call(self, method_name, @@ -794,15 +580,27 @@ def _actor_method_call(self, is_actor_checkpoint_method = (method_name == "__ray_checkpoint__") + # Right now, if the actor handle has been pickled, we create a + # temporary actor handle id for invocations. + # TODO(pcm): This still leads to a lot of actor handles being + # created, there should be a better way to handle pickled + # actor handles. if self._ray_actor_handle_id is None: actor_handle_id = compute_actor_handle_id_non_forked( self._ray_actor_id, self._ray_previous_actor_handle_id, worker.current_task_id) + # Each new task creates a new actor handle id, so we need to + # reset the actor counter to 0 + if (actor_handle_id != + self._ray_previously_generated_actor_handle_id): + self._ray_actor_counter = 0 + self._ray_previously_generated_actor_handle_id = ( + actor_handle_id) else: actor_handle_id = self._ray_actor_handle_id - function_id = compute_actor_method_function_id(self._ray_class_name, - method_name) + function_id = FunctionActorManager.compute_actor_method_function_id( + self._ray_class_name, method_name) object_ids = worker.submit_task( function_id, args, @@ -816,6 +614,7 @@ def _actor_method_call(self, # We add one for the dummy return ID. 
num_return_vals=num_return_vals + 1, resources={"CPU": self._ray_actor_method_cpus}, + placement_resources={}, driver_id=self._ray_actor_driver_id) # Update the actor counter and cursor to reflect the most recent # invocation. @@ -983,8 +782,8 @@ def __ray_terminate__(self): # this is so that when the worker kills itself below, the local # scheduler won't push an error message to the driver. worker.local_scheduler_client.disconnect() - import os - os._exit(0) + sys.exit(0) + assert False, "This process should have terminated." def __ray_save_checkpoint__(self): if hasattr(self, "__ray_save__"): @@ -1068,5 +867,4 @@ def __ray_checkpoint_restore__(self): resources, actor_method_cpus) -ray.worker.global_worker.fetch_and_register_actor = fetch_and_register_actor ray.worker.global_worker.make_actor = make_actor diff --git a/python/ray/autoscaler/autoscaler.py b/python/ray/autoscaler/autoscaler.py index 2a3734ba403c3..9c4a452ee2687 100644 --- a/python/ray/autoscaler/autoscaler.py +++ b/python/ray/autoscaler/autoscaler.py @@ -69,6 +69,7 @@ "project_id": (None, OPTIONAL), # gcp project id, if using gcp "head_ip": (str, OPTIONAL), # local cluster head node "worker_ips": (list, OPTIONAL), # local cluster worker nodes + "use_internal_ips": (bool, OPTIONAL), # don't require public ips }, REQUIRED), @@ -490,8 +491,10 @@ def files_up_to_date(self, node_id): def recover_if_needed(self, node_id): if not self.can_update(node_id): return - last_heartbeat_time = self.load_metrics.last_heartbeat_time_by_ip.get( - self.provider.internal_ip(node_id), 0) + key = self.provider.internal_ip(node_id) + if key not in self.load_metrics.last_heartbeat_time_by_ip: + self.load_metrics.last_heartbeat_time_by_ip[key] = time.time() + last_heartbeat_time = self.load_metrics.last_heartbeat_time_by_ip[key] delta = time.time() - last_heartbeat_time if delta < AUTOSCALER_HEARTBEAT_TIMEOUT_S: return diff --git a/python/ray/autoscaler/aws/config.py b/python/ray/autoscaler/aws/config.py index 8e5d3a4daffc5..62e0b25ee2e2d 100644 --- a/python/ray/autoscaler/aws/config.py +++ b/python/ray/autoscaler/aws/config.py @@ -10,6 +10,7 @@ import boto3 from botocore.config import Config +import botocore from ray.ray_constants import BOTO_MAX_RETRIES @@ -114,7 +115,8 @@ def _configure_key_pair(config): ec2 = _resource("ec2", config) # Try a few times to get or create a good key pair. - for i in range(10): + MAX_NUM_KEYS = 20 + for i in range(MAX_NUM_KEYS): key_name, key_path = key_pair(i, config["provider"]["region"]) key = _get_key(key_name, config) @@ -131,7 +133,12 @@ def _configure_key_pair(config): os.chmod(key_path, 0o600) break - assert key, "AWS keypair {} not found for {}".format(key_name, key_path) + if not key: + raise ValueError( + "No matching local key file for any of the key pairs in this " + "account with ids from 0..{}. 
".format(key_name) + + "Consider deleting some unused keys pairs from your account.") + assert os.path.exists(key_path), \ "Private key file {} not found for {}".format(key_path, key_name) @@ -146,9 +153,10 @@ def _configure_key_pair(config): def _configure_subnet(config): ec2 = _resource("ec2", config) + use_internal_ips = config["provider"].get("use_internal_ips", False) subnets = sorted( - (s for s in ec2.subnets.all() - if s.state == "available" and s.map_public_ip_on_launch), + (s for s in ec2.subnets.all() if s.state == "available" and ( + use_internal_ips or s.map_public_ip_on_launch)), reverse=True, # sort from Z-A key=lambda subnet: subnet.availability_zone) if not subnets: @@ -156,7 +164,8 @@ def _configure_subnet(config): "No usable subnets found, try manually creating an instance in " "your specified region to populate the list of subnets " "and trying this again. Note that the subnet must map public IPs " - "on instance launch.") + "on instance launch unless you set 'use_internal_ips': True in " + "the 'provider' config.") if "availability_zone" in config["provider"]: azs = config["provider"]["availability_zone"].split(',') subnets = [s for s in subnets if s.availability_zone in azs] @@ -264,7 +273,7 @@ def _get_role(role_name, config): try: role.load() return role - except Exception: + except botocore.errorfactory.NoSuchEntityException: return None @@ -274,7 +283,7 @@ def _get_instance_profile(profile_name, config): try: profile.load() return profile - except Exception: + except botocore.errorfactory.NoSuchEntityException: return None diff --git a/python/ray/autoscaler/aws/example-full.yaml b/python/ray/autoscaler/aws/example-full.yaml index 55691863fffb1..d74d45823c211 100644 --- a/python/ray/autoscaler/aws/example-full.yaml +++ b/python/ray/autoscaler/aws/example-full.yaml @@ -89,9 +89,9 @@ setup_commands: # has your Ray repo pre-cloned. Then, you can replace the pip installs # below with a git checkout (and possibly a recompile). 
- echo 'export PATH="$HOME/anaconda3/envs/tensorflow_p36/bin:$PATH"' >> ~/.bashrc - # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp27-cp27mu-manylinux1_x86_64.whl - # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp35-cp35m-manylinux1_x86_64.whl - - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp36-cp36m-manylinux1_x86_64.whl + # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp27-cp27mu-manylinux1_x86_64.whl + # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp35-cp35m-manylinux1_x86_64.whl + - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp36-cp36m-manylinux1_x86_64.whl # Consider uncommenting these if you also want to run apt-get commands during setup # - sudo pkill -9 apt-get || true # - sudo pkill -9 dpkg || true diff --git a/python/ray/autoscaler/commands.py b/python/ray/autoscaler/commands.py index 91d3e4b6b0713..9c63725296df9 100644 --- a/python/ray/autoscaler/commands.py +++ b/python/ray/autoscaler/commands.py @@ -189,7 +189,7 @@ def get_or_create_head_node(config, config_file, no_restart, restart_only, yes, logger.info("Head node up-to-date, IP address is: {}".format( provider.external_ip(head_node))) - monitor_str = "tail -n 100 -f /tmp/raylogs/monitor-*" + monitor_str = "tail -n 100 -f /tmp/ray/session_*/logs/monitor*" for s in init_commands: if ("ray start" in s and "docker exec" in s and "--autoscaling-config" in s): diff --git a/python/ray/autoscaler/gcp/example-full.yaml b/python/ray/autoscaler/gcp/example-full.yaml index e9a95e8543be4..6afbb464fa6a0 100644 --- a/python/ray/autoscaler/gcp/example-full.yaml +++ b/python/ray/autoscaler/gcp/example-full.yaml @@ -124,9 +124,9 @@ setup_commands: pip install google-api-python-client==1.6.7 cython==0.27.3 - # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp27-cp27mu-manylinux1_x86_64.whl - # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp35-cp35m-manylinux1_x86_64.whl - # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.5.2-cp36-cp36m-manylinux1_x86_64.whl + # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp27-cp27mu-manylinux1_x86_64.whl + # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp35-cp35m-manylinux1_x86_64.whl + # - pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-0.6.0-cp36-cp36m-manylinux1_x86_64.whl - >- cd ~ && git clone https://github.com/ray-project/ray || true diff --git a/python/ray/autoscaler/updater.py b/python/ray/autoscaler/updater.py index b132971d2fc53..1d6b5e23b3840 100644 --- a/python/ray/autoscaler/updater.py +++ b/python/ray/autoscaler/updater.py @@ -47,7 +47,8 @@ def __init__(self, self.daemon = True self.process_runner = process_runner self.node_id = node_id - self.use_internal_ip = use_internal_ip + self.use_internal_ip = (use_internal_ip or provider_config.get( + "use_internal_ips", False)) self.provider = get_node_provider(provider_config, cluster_name) self.ssh_private_key = auth_config["ssh_private_key"] self.ssh_user = auth_config["ssh_user"] diff --git a/python/ray/common/redis_module/.gitkeep b/python/ray/common/redis_module/.gitkeep deleted file mode 100644 index e69de29bb2d1d..0000000000000 diff --git a/python/ray/common/redis_module/runtest.py b/python/ray/common/redis_module/runtest.py deleted file mode 
100644 index 7a7d25c6bedc0..0000000000000 --- a/python/ray/common/redis_module/runtest.py +++ /dev/null @@ -1,451 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import os -import redis -import sys -import time -import unittest - -import ray.gcs_utils -import ray.services - - -def integerToAsciiHex(num, numbytes): - retstr = b"" - # Support 32 and 64 bit architecture. - assert (numbytes == 4 or numbytes == 8) - for i in range(numbytes): - curbyte = num & 0xff - if sys.version_info >= (3, 0): - retstr += bytes([curbyte]) - else: - retstr += chr(curbyte) - num = num >> 8 - - return retstr - - -def get_next_message(pubsub_client, timeout_seconds=10): - """Block until the next message is available on the pubsub channel.""" - start_time = time.time() - while True: - message = pubsub_client.get_message() - if message is not None: - return message - time.sleep(0.1) - if time.time() - start_time > timeout_seconds: - raise Exception("Timed out while waiting for next message.") - - -class TestGlobalStateStore(unittest.TestCase): - def setUp(self): - unused_primary_redis_addr, redis_shards = ray.services.start_redis( - "localhost", use_credis="RAY_USE_NEW_GCS" in os.environ) - self.redis = redis.StrictRedis( - host="localhost", port=redis_shards[0].split(":")[-1], db=0) - - def tearDown(self): - ray.services.cleanup() - - def testInvalidObjectTableAdd(self): - # Check that Redis returns an error when RAY.OBJECT_TABLE_ADD is called - # with the wrong arguments. - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.OBJECT_TABLE_ADD") - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "hello") - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id2", - "one", "hash2", "manager_id1") - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id2", 1, - "hash2", "manager_id1", - "extra argument") - # Check that Redis returns an error when RAY.OBJECT_TABLE_ADD adds an - # object ID that is already present with a different hash. - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash1", "manager_id1") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id1"}) - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash2", "manager_id2") - # Check that the second manager was added, even though the hash was - # mismatched. - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id1", b"manager_id2"}) - # Check that it is fine if we add the same object ID multiple times - # with the most recent hash. 
- self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash2", "manager_id1") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash2", "manager_id1") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash2", "manager_id2") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 2, - "hash2", "manager_id2") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id1", b"manager_id2"}) - - def testObjectTableAddAndLookup(self): - # Try calling RAY.OBJECT_TABLE_LOOKUP with an object ID that has not - # been added yet. - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(response, None) - # Add some managers and try again. - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash1", "manager_id1") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash1", "manager_id2") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id1", b"manager_id2"}) - # Add a manager that already exists again and try again. - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash1", "manager_id2") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id1", b"manager_id2"}) - # Check that we properly handle NULL characters. In the past, NULL - # characters were handled improperly causing a "hash mismatch" error if - # two object IDs that agreed up to the NULL character were inserted - # with different hashes. - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "\x00object_id3", 1, - "hash1", "manager_id1") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "\x00object_id4", 1, - "hash2", "manager_id1") - # Check that NULL characters in the hash are handled properly. - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id3", 1, - "\x00hash1", "manager_id1") - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id3", 1, - "\x00hash2", "manager_id1") - - def testObjectTableAddAndRemove(self): - # Try removing a manager from an object ID that has not been added yet. - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.OBJECT_TABLE_REMOVE", "object_id1", - "manager_id1") - # Try calling RAY.OBJECT_TABLE_LOOKUP with an object ID that has not - # been added yet. - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(response, None) - # Add some managers and try again. - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash1", "manager_id1") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash1", "manager_id2") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id1", b"manager_id2"}) - # Remove a manager that doesn't exist, and make sure we still have the - # same set. - self.redis.execute_command("RAY.OBJECT_TABLE_REMOVE", "object_id1", - "manager_id3") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id1", b"manager_id2"}) - # Remove a manager that does exist. Make sure it gets removed the first - # time and does nothing the second time. 
- self.redis.execute_command("RAY.OBJECT_TABLE_REMOVE", "object_id1", - "manager_id1") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id2"}) - self.redis.execute_command("RAY.OBJECT_TABLE_REMOVE", "object_id1", - "manager_id1") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), {b"manager_id2"}) - # Remove the last manager, and make sure we have an empty set. - self.redis.execute_command("RAY.OBJECT_TABLE_REMOVE", "object_id1", - "manager_id2") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), set()) - # Remove a manager from an empty set, and make sure we now have an - # empty set. - self.redis.execute_command("RAY.OBJECT_TABLE_REMOVE", "object_id1", - "manager_id3") - response = self.redis.execute_command("RAY.OBJECT_TABLE_LOOKUP", - "object_id1") - self.assertEqual(set(response), set()) - - def testObjectTableSubscribeToNotifications(self): - # Define a helper method for checking the contents of object - # notifications. - def check_object_notification(notification_message, object_id, - object_size, manager_ids): - notification_object = (ray.gcs_utils.SubscribeToNotificationsReply. - GetRootAsSubscribeToNotificationsReply( - notification_message, 0)) - self.assertEqual(notification_object.ObjectId(), object_id) - self.assertEqual(notification_object.ObjectSize(), object_size) - self.assertEqual(notification_object.ManagerIdsLength(), - len(manager_ids)) - for i in range(len(manager_ids)): - self.assertEqual( - notification_object.ManagerIds(i), manager_ids[i]) - - data_size = 0xf1f0 - p = self.redis.pubsub() - # Subscribe to an object ID. - p.psubscribe("{}manager_id1".format( - ray.gcs_utils.OBJECT_CHANNEL_PREFIX)) - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", - data_size, "hash1", "manager_id2") - # Receive the acknowledgement message. - self.assertEqual(get_next_message(p)["data"], 1) - # Request a notification and receive the data. - self.redis.execute_command("RAY.OBJECT_TABLE_REQUEST_NOTIFICATIONS", - "manager_id1", "object_id1") - # Verify that the notification is correct. - check_object_notification( - get_next_message(p)["data"], b"object_id1", data_size, - [b"manager_id2"]) - - # Request a notification for an object that isn't there. Then add the - # object and receive the data. Only the first call to - # RAY.OBJECT_TABLE_ADD should trigger notifications. - self.redis.execute_command("RAY.OBJECT_TABLE_REQUEST_NOTIFICATIONS", - "manager_id1", "object_id2", "object_id3") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id3", - data_size, "hash1", "manager_id1") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id3", - data_size, "hash1", "manager_id2") - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id3", - data_size, "hash1", "manager_id3") - # Verify that the notification is correct. - check_object_notification( - get_next_message(p)["data"], b"object_id3", data_size, - [b"manager_id1"]) - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id2", - data_size, "hash1", "manager_id3") - # Verify that the notification is correct. - check_object_notification( - get_next_message(p)["data"], b"object_id2", data_size, - [b"manager_id3"]) - # Request notifications for object_id3 again. 
- self.redis.execute_command("RAY.OBJECT_TABLE_REQUEST_NOTIFICATIONS", - "manager_id1", "object_id3") - # Verify that the notification is correct. - check_object_notification( - get_next_message(p)["data"], b"object_id3", data_size, - [b"manager_id1", b"manager_id2", b"manager_id3"]) - - def testResultTableAddAndLookup(self): - def check_result_table_entry(message, task_id, is_put): - result_table_reply = ( - ray.gcs_utils.ResultTableReply.GetRootAsResultTableReply( - message, 0)) - self.assertEqual(result_table_reply.TaskId(), task_id) - self.assertEqual(result_table_reply.IsPut(), is_put) - - # Try looking up something in the result table before anything is - # added. - response = self.redis.execute_command("RAY.RESULT_TABLE_LOOKUP", - "object_id1") - self.assertIsNone(response) - # Adding the object to the object table should have no effect. - self.redis.execute_command("RAY.OBJECT_TABLE_ADD", "object_id1", 1, - "hash1", "manager_id1") - response = self.redis.execute_command("RAY.RESULT_TABLE_LOOKUP", - "object_id1") - self.assertIsNone(response) - # Add the result to the result table. The lookup now returns the task - # ID. - task_id = b"task_id1" - self.redis.execute_command("RAY.RESULT_TABLE_ADD", "object_id1", - task_id, 0) - response = self.redis.execute_command("RAY.RESULT_TABLE_LOOKUP", - "object_id1") - check_result_table_entry(response, task_id, False) - # Doing it again should still work. - response = self.redis.execute_command("RAY.RESULT_TABLE_LOOKUP", - "object_id1") - check_result_table_entry(response, task_id, False) - # Try another result table lookup. This should succeed. - task_id = b"task_id2" - self.redis.execute_command("RAY.RESULT_TABLE_ADD", "object_id2", - task_id, 1) - response = self.redis.execute_command("RAY.RESULT_TABLE_LOOKUP", - "object_id2") - check_result_table_entry(response, task_id, True) - - def testInvalidTaskTableAdd(self): - # Check that Redis returns an error when RAY.TASK_TABLE_ADD is called - # with the wrong arguments. - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.TASK_TABLE_ADD") - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.TASK_TABLE_ADD", "hello") - with self.assertRaises(redis.ResponseError): - self.redis.execute_command("RAY.TASK_TABLE_ADD", "task_id", 3, - "node_id") - with self.assertRaises(redis.ResponseError): - # Non-integer scheduling states should not be added. - self.redis.execute_command("RAY.TASK_TABLE_ADD", "task_id", - "invalid_state", "node_id", "task_spec") - with self.assertRaises(redis.ResponseError): - # Should not be able to update a non-existent task. 
- self.redis.execute_command("RAY.TASK_TABLE_UPDATE", "task_id", 10, - "node_id", b"") - - def testTaskTableAddAndLookup(self): - TASK_STATUS_WAITING = 1 - TASK_STATUS_SCHEDULED = 2 - TASK_STATUS_QUEUED = 4 - - # make sure somebody will get a notification (checked in the redis - # module) - p = self.redis.pubsub() - p.psubscribe("{prefix}*:*".format(prefix=ray.gcs_utils.TASK_PREFIX)) - - def check_task_reply(message, task_args, updated=False): - (task_status, local_scheduler_id, execution_dependencies_string, - spillback_count, task_spec) = task_args - task_reply_object = ray.gcs_utils.TaskReply.GetRootAsTaskReply( - message, 0) - self.assertEqual(task_reply_object.State(), task_status) - self.assertEqual(task_reply_object.LocalSchedulerId(), - local_scheduler_id) - self.assertEqual(task_reply_object.SpillbackCount(), - spillback_count) - self.assertEqual(task_reply_object.TaskSpec(), task_spec) - self.assertEqual(task_reply_object.Updated(), updated) - - # Check that task table adds, updates, and lookups work correctly. - task_args = [TASK_STATUS_WAITING, b"node_id", b"", 0, b"task_spec"] - response = self.redis.execute_command("RAY.TASK_TABLE_ADD", "task_id", - *task_args) - response = self.redis.execute_command("RAY.TASK_TABLE_GET", "task_id") - check_task_reply(response, task_args) - - task_args[0] = TASK_STATUS_SCHEDULED - self.redis.execute_command("RAY.TASK_TABLE_UPDATE", "task_id", - *task_args[:4]) - response = self.redis.execute_command("RAY.TASK_TABLE_GET", "task_id") - check_task_reply(response, task_args) - - # If the current value, test value, and set value are all the same, the - # update happens, and the response is still the same task. - task_args = [task_args[0]] + task_args - response = self.redis.execute_command("RAY.TASK_TABLE_TEST_AND_UPDATE", - "task_id", *task_args[:3]) - check_task_reply(response, task_args[1:], updated=True) - # Check that the task entry is still the same. - get_response = self.redis.execute_command("RAY.TASK_TABLE_GET", - "task_id") - check_task_reply(get_response, task_args[1:]) - - # If the current value is the same as the test value, and the set value - # is different, the update happens, and the response is the entire - # task. - task_args[1] = TASK_STATUS_QUEUED - response = self.redis.execute_command("RAY.TASK_TABLE_TEST_AND_UPDATE", - "task_id", *task_args[:3]) - check_task_reply(response, task_args[1:], updated=True) - # Check that the update happened. - get_response = self.redis.execute_command("RAY.TASK_TABLE_GET", - "task_id") - check_task_reply(get_response, task_args[1:]) - - # If the current value is no longer the same as the test value, the - # response is the same task as before the test-and-set. - new_task_args = task_args[:] - new_task_args[1] = TASK_STATUS_WAITING - response = self.redis.execute_command("RAY.TASK_TABLE_TEST_AND_UPDATE", - "task_id", *new_task_args[:3]) - check_task_reply(response, task_args[1:], updated=False) - # Check that the update did not happen. - get_response2 = self.redis.execute_command("RAY.TASK_TABLE_GET", - "task_id") - self.assertEqual(get_response2, get_response) - - # If the test value is a bitmask that matches the current value, the - # update happens. 
- task_args = new_task_args - task_args[0] = TASK_STATUS_SCHEDULED | TASK_STATUS_QUEUED - response = self.redis.execute_command("RAY.TASK_TABLE_TEST_AND_UPDATE", - "task_id", *task_args[:3]) - check_task_reply(response, task_args[1:], updated=True) - - # If the test value is a bitmask that does not match the current value, - # the update does not happen, and the response is the same task as - # before the test-and-set. - new_task_args = task_args[:] - new_task_args[0] = TASK_STATUS_SCHEDULED - old_response = response - response = self.redis.execute_command("RAY.TASK_TABLE_TEST_AND_UPDATE", - "task_id", *new_task_args[:3]) - check_task_reply(response, task_args[1:], updated=False) - # Check that the update did not happen. - get_response = self.redis.execute_command("RAY.TASK_TABLE_GET", - "task_id") - self.assertNotEqual(get_response, old_response) - check_task_reply(get_response, task_args[1:]) - - def check_task_subscription(self, p, scheduling_state, local_scheduler_id): - task_args = [ - b"task_id", scheduling_state, - local_scheduler_id.encode("ascii"), b"", 0, b"task_spec" - ] - self.redis.execute_command("RAY.TASK_TABLE_ADD", *task_args) - # Receive the data. - message = get_next_message(p)["data"] - # Check that the notification object is correct. - notification_object = ray.gcs_utils.TaskReply.GetRootAsTaskReply( - message, 0) - self.assertEqual(notification_object.TaskId(), task_args[0]) - self.assertEqual(notification_object.State(), task_args[1]) - self.assertEqual(notification_object.LocalSchedulerId(), task_args[2]) - self.assertEqual(notification_object.ExecutionDependencies(), - task_args[3]) - self.assertEqual(notification_object.TaskSpec(), task_args[-1]) - - def testTaskTableSubscribe(self): - scheduling_state = 1 - local_scheduler_id = "local_scheduler_id" - # Subscribe to the task table. - p = self.redis.pubsub() - p.psubscribe("{prefix}*:*".format(prefix=ray.gcs_utils.TASK_PREFIX)) - # Receive acknowledgment. - self.assertEqual(get_next_message(p)["data"], 1) - self.check_task_subscription(p, scheduling_state, local_scheduler_id) - # unsubscribe to make sure there is only one subscriber at a given time - p.punsubscribe("{prefix}*:*".format(prefix=ray.gcs_utils.TASK_PREFIX)) - # Receive acknowledgment. - self.assertEqual(get_next_message(p)["data"], 0) - - p.psubscribe("{prefix}*:{state}".format( - prefix=ray.gcs_utils.TASK_PREFIX, state=scheduling_state)) - # Receive acknowledgment. - self.assertEqual(get_next_message(p)["data"], 1) - self.check_task_subscription(p, scheduling_state, local_scheduler_id) - p.punsubscribe("{prefix}*:{state}".format( - prefix=ray.gcs_utils.TASK_PREFIX, state=scheduling_state)) - # Receive acknowledgment. - self.assertEqual(get_next_message(p)["data"], 0) - - p.psubscribe("{prefix}{local_scheduler_id}:*".format( - prefix=ray.gcs_utils.TASK_PREFIX, - local_scheduler_id=local_scheduler_id)) - # Receive acknowledgment. - self.assertEqual(get_next_message(p)["data"], 1) - self.check_task_subscription(p, scheduling_state, local_scheduler_id) - p.punsubscribe("{prefix}{local_scheduler_id}:*".format( - prefix=ray.gcs_utils.TASK_PREFIX, - local_scheduler_id=local_scheduler_id)) - # Receive acknowledgment. 
- self.assertEqual(get_next_message(p)["data"], 0) - - -if __name__ == "__main__": - unittest.main(verbosity=2) diff --git a/python/ray/common/test/test.py b/python/ray/common/test/test.py deleted file mode 100644 index cd36b697bbaad..0000000000000 --- a/python/ray/common/test/test.py +++ /dev/null @@ -1,181 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import numpy as np -import pickle -import sys -import unittest - -import ray.local_scheduler as local_scheduler -import ray.ray_constants as ray_constants - - -def random_object_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_function_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_driver_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_task_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -BASE_SIMPLE_OBJECTS = [ - 0, 1, 100000, 0.0, 0.5, 0.9, 100000.1, (), [], {}, "", 990 * "h", u"", - 990 * u"h", - np.ones(3), - np.array([True, False]), None, True, False -] - -if sys.version_info < (3, 0): - BASE_SIMPLE_OBJECTS += [ - long(0), # noqa: E501,F821 - long(1), # noqa: E501,F821 - long(100000), # noqa: E501,F821 - long(1 << 100) # noqa: E501,F821 - ] - -LIST_SIMPLE_OBJECTS = [[obj] for obj in BASE_SIMPLE_OBJECTS] -TUPLE_SIMPLE_OBJECTS = [(obj, ) for obj in BASE_SIMPLE_OBJECTS] -DICT_SIMPLE_OBJECTS = [{(): obj} for obj in BASE_SIMPLE_OBJECTS] - -SIMPLE_OBJECTS = (BASE_SIMPLE_OBJECTS + LIST_SIMPLE_OBJECTS + - TUPLE_SIMPLE_OBJECTS + DICT_SIMPLE_OBJECTS) - -# Create some complex objects that cannot be serialized by value in tasks. - -lst = [] -lst.append(lst) - - -class Foo(object): - def __init__(self): - pass - - -BASE_COMPLEX_OBJECTS = [ - 15000 * "h", 15000 * u"h", lst, - Foo(), 100 * [100 * [10 * [1]]], - np.array([Foo()]) -] - -LIST_COMPLEX_OBJECTS = [[obj] for obj in BASE_COMPLEX_OBJECTS] -TUPLE_COMPLEX_OBJECTS = [(obj, ) for obj in BASE_COMPLEX_OBJECTS] -DICT_COMPLEX_OBJECTS = [{(): obj} for obj in BASE_COMPLEX_OBJECTS] - -COMPLEX_OBJECTS = (BASE_COMPLEX_OBJECTS + LIST_COMPLEX_OBJECTS + - TUPLE_COMPLEX_OBJECTS + DICT_COMPLEX_OBJECTS) - - -class TestSerialization(unittest.TestCase): - def test_serialize_by_value(self): - - for val in SIMPLE_OBJECTS: - self.assertTrue(local_scheduler.check_simple_value(val)) - for val in COMPLEX_OBJECTS: - self.assertFalse(local_scheduler.check_simple_value(val)) - - -class TestObjectID(unittest.TestCase): - def test_create_object_id(self): - random_object_id() - - def test_cannot_pickle_object_ids(self): - object_ids = [random_object_id() for _ in range(256)] - - def f(): - return object_ids - - def g(val=object_ids): - return 1 - - def h(): - object_ids[0] - return 1 - - # Make sure that object IDs cannot be pickled (including functions that - # close over object IDs). 
- self.assertRaises(Exception, lambda: pickle.dumps(object_ids[0])) - self.assertRaises(Exception, lambda: pickle.dumps(object_ids)) - self.assertRaises(Exception, lambda: pickle.dumps(f)) - self.assertRaises(Exception, lambda: pickle.dumps(g)) - self.assertRaises(Exception, lambda: pickle.dumps(h)) - - def test_equality_comparisons(self): - x1 = local_scheduler.ObjectID(ray_constants.ID_SIZE * b"a") - x2 = local_scheduler.ObjectID(ray_constants.ID_SIZE * b"a") - y1 = local_scheduler.ObjectID(ray_constants.ID_SIZE * b"b") - y2 = local_scheduler.ObjectID(ray_constants.ID_SIZE * b"b") - self.assertEqual(x1, x2) - self.assertEqual(y1, y2) - self.assertNotEqual(x1, y1) - - random_strings = [ - np.random.bytes(ray_constants.ID_SIZE) for _ in range(256) - ] - object_ids1 = [ - local_scheduler.ObjectID(random_strings[i]) for i in range(256) - ] - object_ids2 = [ - local_scheduler.ObjectID(random_strings[i]) for i in range(256) - ] - self.assertEqual(len(set(object_ids1)), 256) - self.assertEqual(len(set(object_ids1 + object_ids2)), 256) - self.assertEqual(set(object_ids1), set(object_ids2)) - - def test_hashability(self): - x = random_object_id() - y = random_object_id() - {x: y} - {x, y} - - -class TestTask(unittest.TestCase): - def check_task(self, task, function_id, num_return_vals, args): - self.assertEqual(function_id.id(), task.function_id().id()) - retrieved_args = task.arguments() - self.assertEqual(num_return_vals, len(task.returns())) - self.assertEqual(len(args), len(retrieved_args)) - for i in range(len(retrieved_args)): - if isinstance(retrieved_args[i], local_scheduler.ObjectID): - self.assertEqual(retrieved_args[i].id(), args[i].id()) - else: - self.assertEqual(retrieved_args[i], args[i]) - - def test_create_and_serialize_task(self): - # TODO(rkn): The function ID should be a FunctionID object, not an - # ObjectID. 
- driver_id = random_driver_id() - parent_id = random_task_id() - function_id = random_function_id() - object_ids = [random_object_id() for _ in range(256)] - args_list = [[], 1 * [1], 10 * [1], 100 * [1], 1000 * [1], 1 * ["a"], - 10 * ["a"], 100 * ["a"], 1000 * ["a"], [ - 1, 1.3, 2, 1 << 100, "hi", u"hi", [1, 2] - ], object_ids[:1], object_ids[:2], object_ids[:3], - object_ids[:4], object_ids[:5], object_ids[:10], - object_ids[:100], object_ids[:256], [1, object_ids[0]], [ - object_ids[0], "a" - ], [1, object_ids[0], "a"], [ - object_ids[0], 1, object_ids[1], "a" - ], object_ids[:3] + [1, "hi", 2.3] + object_ids[:5], - object_ids + 100 * ["a"] + object_ids] - for args in args_list: - for num_return_vals in [0, 1, 2, 3, 5, 10, 100]: - task = local_scheduler.Task(driver_id, function_id, args, - num_return_vals, parent_id, 0) - self.check_task(task, function_id, num_return_vals, args) - data = local_scheduler.task_to_string(task) - task2 = local_scheduler.task_from_string(data) - self.check_task(task2, function_id, num_return_vals, args) - - -if __name__ == "__main__": - unittest.main(verbosity=2) diff --git a/python/ray/common/thirdparty/redis/src/.gitkeep b/python/ray/common/thirdparty/redis/src/.gitkeep deleted file mode 100644 index e69de29bb2d1d..0000000000000 diff --git a/python/ray/common/__init__.py b/python/ray/core/src/ray/__init__.py similarity index 100% rename from python/ray/common/__init__.py rename to python/ray/core/src/ray/__init__.py diff --git a/python/ray/core/src/local_scheduler/__init__.py b/python/ray/core/src/ray/raylet/__init__.py similarity index 100% rename from python/ray/core/src/local_scheduler/__init__.py rename to python/ray/core/src/ray/raylet/__init__.py diff --git a/python/ray/experimental/async_api.py b/python/ray/experimental/async_api.py new file mode 100644 index 0000000000000..8df8596e29aa5 --- /dev/null +++ b/python/ray/experimental/async_api.py @@ -0,0 +1,62 @@ +# Note: asyncio is only compatible with Python 3 + +import asyncio +import ray +from ray.experimental.async_plasma import PlasmaProtocol, PlasmaEventHandler + +handler = None +transport = None +protocol = None + + +async def _async_init(): + global handler, transport, protocol + if handler is None: + worker = ray.worker.global_worker + loop = asyncio.get_event_loop() + worker.plasma_client.subscribe() + rsock = worker.plasma_client.get_notification_socket() + handler = PlasmaEventHandler(loop, worker) + transport, protocol = await loop.create_connection( + lambda: PlasmaProtocol(worker.plasma_client, handler), sock=rsock) + + +def init(): + """ + Initialize synchronously. + """ + loop = asyncio.get_event_loop() + if loop.is_running(): + raise Exception("You must initialize the Ray async API by calling " + "async_api.init() or async_api.as_future(obj) before " + "the event loop starts.") + else: + asyncio.get_event_loop().run_until_complete(_async_init()) + + +def as_future(object_id): + """Turn an object_id into a Future object. + + Args: + object_id: A Ray object_id. + + Returns: + PlasmaObjectFuture: A future object that waits the object_id. + """ + if handler is None: + init() + return handler.as_future(object_id) + + +def shutdown(): + """Manually shutdown the async API. + + Cancels all related tasks and all the socket transportation. 
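# A minimal usage sketch for the async API above (not part of the patch
# itself). It assumes a local ray.init() and a trivial remote task f;
# asyncio, and therefore this API, is Python 3 only, and init() must run
# before the event loop starts.
import asyncio
import ray
from ray.experimental import async_api

ray.init()
async_api.init()  # set up the plasma notification connection up front

@ray.remote
def f():
    return 42

async def main():
    # as_future() wraps the Ray ObjectID in an asyncio-compatible future.
    result = await async_api.as_future(f.remote())
    print(result)  # 42

asyncio.get_event_loop().run_until_complete(main())
async_api.shutdown()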
+ """ + global handler, transport, protocol + if handler is not None: + handler.close() + transport.close() + handler = None + transport = None + protocol = None diff --git a/python/ray/experimental/async_plasma.py b/python/ray/experimental/async_plasma.py new file mode 100644 index 0000000000000..2c0f806f2467b --- /dev/null +++ b/python/ray/experimental/async_plasma.py @@ -0,0 +1,237 @@ +import asyncio +import ctypes +import sys + +import pyarrow.plasma as plasma + +import ray +from ray.services import logger + +INT64_SIZE = ctypes.sizeof(ctypes.c_int64) + + +def _release_waiter(waiter, *_): + if not waiter.done(): + waiter.set_result(None) + + +class PlasmaProtocol(asyncio.Protocol): + """Protocol control for the asyncio connection.""" + + def __init__(self, plasma_client, plasma_event_handler): + self.plasma_client = plasma_client + self.plasma_event_handler = plasma_event_handler + self.transport = None + self._buffer = b"" + + def connection_made(self, transport): + self.transport = transport + + def data_received(self, data): + self._buffer += data + messages = [] + i = 0 + while i + INT64_SIZE <= len(self._buffer): + msg_len = int.from_bytes(self._buffer[i:i + INT64_SIZE], + sys.byteorder) + if i + INT64_SIZE + msg_len > len(self._buffer): + break + i += INT64_SIZE + segment = self._buffer[i:i + msg_len] + i += msg_len + messages.append(self.plasma_client.decode_notification(segment)) + + self._buffer = self._buffer[i:] + self.plasma_event_handler.process_notifications(messages) + + def connection_lost(self, exc): + # The socket has been closed + logger.debug("PlasmaProtocol - connection lost.") + + def eof_received(self): + logger.debug("PlasmaProtocol - EOF received.") + self.transport.close() + + +class PlasmaObjectFuture(asyncio.Future): + """This class manages the lifecycle of a Future contains an object_id. + + Note: + This Future is an item in an linked list. + + Attributes: + object_id: The object_id this Future contains. + """ + + def __init__(self, loop, object_id): + super().__init__(loop=loop) + self.object_id = object_id + self.prev = None + self.next = None + + @property + def ray_object_id(self): + return ray.ObjectID(self.object_id.binary()) + + def __repr__(self): + return super().__repr__() + "{object_id=%s}" % self.object_id + + +class PlasmaObjectLinkedList(asyncio.Future): + """This class is a doubly-linked list. + It holds a ObjectID and maintains futures assigned to the ObjectID. + + Args: + loop: an event loop. + plain_object_id (plasma.ObjectID): + The plasma ObjectID this class holds. + """ + + def __init__(self, loop, plain_object_id): + super().__init__(loop=loop) + assert isinstance(plain_object_id, plasma.ObjectID) + self.object_id = plain_object_id + self.head = None + self.tail = None + + def append(self, future): + """Append an object to the linked list. + + Args: + future (PlasmaObjectFuture): A PlasmaObjectFuture instance. + """ + future.prev = self.tail + if self.tail is None: + assert self.head is None + self.head = future + else: + self.tail.next = future + self.tail = future + # Once done, it will be removed from the list. + future.add_done_callback(self.remove) + + def remove(self, future): + """Remove an object from the linked list. + + Args: + future (PlasmaObjectFuture): A PlasmaObjectFuture instance. 
+ """ + if self._loop.get_debug(): + logger.debug("Removing %s from the linked list.", future) + if future.prev is None: + assert future is self.head + self.head = future.next + if self.head is None: + self.tail = None + if not self.cancelled(): + self.set_result(None) + else: + self.head.prev = None + elif future.next is None: + assert future is self.tail + self.tail = future.prev + if self.tail is None: + self.head = None + if not self.cancelled(): + self.set_result(None) + else: + self.tail.prev = None + + def cancel(self, *args, **kwargs): + """Manually cancel all tasks assigned to this event loop.""" + # Because remove all futures will trigger `set_result`, + # we cancel itself first. + super().cancel() + for future in self.traverse(): + # All cancelled futures should have callbacks to removed itself + # from this linked list. However, these callbacks are scheduled in + # an event loop, so we could still find them in our list. + if not future.cancelled(): + future.cancel() + + def set_result(self, result): + """Complete all tasks. """ + for future in self.traverse(): + # All cancelled futures should have callbacks to removed itself + # from this linked list. However, these callbacks are scheduled in + # an event loop, so we could still find them in our list. + future.set_result(result) + if not self.done(): + super().set_result(result) + + def traverse(self): + """Traverse this linked list. + + Yields: + PlasmaObjectFuture: PlasmaObjectFuture instances. + """ + current = self.head + while current is not None: + yield current + current = current.next + + +class PlasmaEventHandler: + """This class is an event handler for Plasma.""" + + def __init__(self, loop, worker): + super().__init__() + self._loop = loop + self._worker = worker + self._waiting_dict = {} + + def process_notifications(self, messages): + """Process notifications.""" + for object_id, object_size, metadata_size in messages: + if object_size > 0 and object_id in self._waiting_dict: + linked_list = self._waiting_dict[object_id] + self._complete_future(linked_list) + + def close(self): + """Clean up this handler.""" + for linked_list in self._waiting_dict.values(): + linked_list.cancel() + # All cancelled linked lists should have callbacks to removed itself + # from the waiting dict. However, these callbacks are scheduled in + # an event loop, so we don't check them now. + + def _unregister_callback(self, fut): + del self._waiting_dict[fut.object_id] + + def _complete_future(self, fut): + obj = self._worker.retrieve_and_deserialize([fut.object_id], 0)[0] + fut.set_result(obj) + + def as_future(self, object_id, check_ready=True): + """Turn an object_id into a Future object. + + Args: + object_id: A Ray's object_id. + check_ready (bool): If true, check if the object_id is ready. + + Returns: + PlasmaObjectFuture: A future object that waits the object_id. 
+ """ + if not isinstance(object_id, ray.ObjectID): + raise TypeError("Input should be an ObjectID.") + + plain_object_id = plasma.ObjectID(object_id.id()) + fut = PlasmaObjectFuture(loop=self._loop, object_id=plain_object_id) + + if check_ready: + ready, _ = ray.wait([object_id], timeout=0) + if ready: + if self._loop.get_debug(): + logger.debug("%s has been ready.", plain_object_id) + self._complete_future(fut) + return fut + + if plain_object_id not in self._waiting_dict: + linked_list = PlasmaObjectLinkedList(self._loop, plain_object_id) + linked_list.add_done_callback(self._unregister_callback) + self._waiting_dict[plain_object_id] = linked_list + self._waiting_dict[plain_object_id].append(fut) + if self._loop.get_debug(): + logger.debug("%s added to the waiting list.", fut) + + return fut diff --git a/python/ray/experimental/sgd/__init__.py b/python/ray/experimental/sgd/__init__.py index e69de29bb2d1d..005b3fff0c1f0 100644 --- a/python/ray/experimental/sgd/__init__.py +++ b/python/ray/experimental/sgd/__init__.py @@ -0,0 +1,11 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +from ray.experimental.sgd.sgd import DistributedSGD +from ray.experimental.sgd.model import Model + +__all__ = [ + "DistributedSGD", + "Model", +] diff --git a/python/ray/experimental/sgd/mnist_example.py b/python/ray/experimental/sgd/mnist_example.py new file mode 100755 index 0000000000000..8c2fff213c94b --- /dev/null +++ b/python/ray/experimental/sgd/mnist_example.py @@ -0,0 +1,134 @@ +#!/usr/bin/env python +"""Example of how to train a model with Ray SGD. + +We use a small model here, so no speedup for distributing the computation is +expected. This example shows: + - How to set up a simple input pipeline + - How to evaluate model accuracy during training + - How to get and set model weights + - How to train with ray.experimental.sgd.DistributedSGD +""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import argparse +import time + +from tensorflow.examples.tutorials.mnist import input_data +import tensorflow as tf + +import ray +from ray.tune import run_experiments +from ray.tune.examples.tune_mnist_ray import deepnn +from ray.experimental.sgd.model import Model +from ray.experimental.sgd.sgd import DistributedSGD +from ray.experimental.tfutils import TensorFlowVariables + +parser = argparse.ArgumentParser() +parser.add_argument("--redis-address", default=None, type=str) +parser.add_argument("--num-iters", default=10000, type=int) +parser.add_argument("--batch-size", default=50, type=int) +parser.add_argument("--num-workers", default=1, type=int) +parser.add_argument("--devices-per-worker", default=1, type=int) +parser.add_argument("--tune", action="store_true", help="Run in Ray Tune") +parser.add_argument( + "--strategy", default="ps", type=str, help="One of 'simple' or 'ps'") +parser.add_argument( + "--gpu", action="store_true", help="Use GPUs for optimization") + + +class MNISTModel(Model): + def __init__(self): + # Import data + error = None + for _ in range(10): + try: + self.mnist = input_data.read_data_sets( + "/tmp/tensorflow/mnist/input_data", one_hot=True) + error = None + break + except Exception as e: + error = e + time.sleep(5) + if error: + raise ValueError("Failed to import data", error) + + # Set seed and build layers + tf.set_random_seed(0) + self.x = tf.placeholder(tf.float32, [None, 784], name="x") + self.y_ = tf.placeholder(tf.float32, [None, 10], 
name="y_") + y_conv, self.keep_prob = deepnn(self.x) + + # Need to define loss and optimizer attributes + self.loss = tf.reduce_mean( + tf.nn.softmax_cross_entropy_with_logits( + labels=self.y_, logits=y_conv)) + self.optimizer = tf.train.AdamOptimizer(1e-4) + self.variables = TensorFlowVariables(self.loss, + tf.get_default_session()) + + # For evaluating test accuracy + correct_prediction = tf.equal( + tf.argmax(y_conv, 1), tf.argmax(self.y_, 1)) + self.accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32)) + + def get_feed_dict(self): + batch = self.mnist.train.next_batch(50) + return { + self.x: batch[0], + self.y_: batch[1], + self.keep_prob: 0.5, + } + + def test_accuracy(self): + return self.accuracy.eval( + feed_dict={ + self.x: self.mnist.test.images, + self.y_: self.mnist.test.labels, + self.keep_prob: 1.0, + }) + + +def train_mnist(config, reporter): + args = config["args"] + sgd = DistributedSGD( + lambda w_i, d_i: MNISTModel(), + num_workers=args.num_workers, + devices_per_worker=args.devices_per_worker, + gpu=args.gpu, + strategy=args.strategy) + + # Important: synchronize the initial weights of all model replicas + w0 = sgd.for_model(lambda m: m.variables.get_flat()) + sgd.foreach_model(lambda m: m.variables.set_flat(w0)) + + for i in range(args.num_iters): + if i % 10 == 0: + start = time.time() + loss = sgd.step(fetch_stats=True)["loss"] + acc = sgd.foreach_model(lambda model: model.test_accuracy()) + print("Iter", i, "loss", loss, "accuracy", acc) + print("Time per iteration", time.time() - start) + assert len(set(acc)) == 1, ("Models out of sync", acc) + reporter(timesteps_total=i, mean_loss=loss, mean_accuracy=acc[0]) + else: + sgd.step() + + +if __name__ == "__main__": + args = parser.parse_args() + ray.init(redis_address=args.redis_address) + + if args.tune: + run_experiments({ + "mnist_sgd": { + "run": train_mnist, + "config": { + "args": args, + }, + }, + }) + else: + train_mnist({"args": args}, lambda **kw: None) diff --git a/python/ray/experimental/sgd/model.py b/python/ray/experimental/sgd/model.py new file mode 100644 index 0000000000000..ac8e0eedf23ea --- /dev/null +++ b/python/ray/experimental/sgd/model.py @@ -0,0 +1,26 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + + +class Model(object): + """Your class must implement this interface to be used with Ray SGD. + + This supports any form of input pipeline: it is up to you to define it + using TensorFlow. The only requirements are that the loss and optimizer + attributes must be defined. + + For an example implementation, see tfbench/test_model.py + + Attributes: + loss (tf.Tensor): Loss function to minimize. + optimizer (tf.train.Optimizer): Optimizer to use to minimize the loss. + """ + + def get_feed_dict(self): + """Extra values to pass in when computing gradients for the loss. + + Returns: + TensorFlow feed_dict to add to the gradient operation. 
+ """ + return {} diff --git a/python/ray/experimental/sgd/modified_allreduce.py b/python/ray/experimental/sgd/modified_allreduce.py index a9d6879f99c7b..7c446aa974e15 100644 --- a/python/ray/experimental/sgd/modified_allreduce.py +++ b/python/ray/experimental/sgd/modified_allreduce.py @@ -584,7 +584,15 @@ def end_interval(indices, small_ranges, large_indices): if len(small_ranges): new_tower_grads = [] for dev_idx, gv_list in enumerate(tower_grads): - assert len(gv_list) == num_gv + assert len(gv_list) == num_gv, ( + "Possible cause: " + "Networks constructed on different workers " + "don't have the same number of variables. " + "If you use tf.GraphKeys or tf.global_variables() " + "with multiple graphs per worker during network " + "construction, you need to use " + "appropriate scopes, see " + "https://github.com/ray-project/ray/issues/3136") new_gv_list = [] for r in small_ranges: key = '%d:%d' % (dev_idx, len(new_gv_list)) diff --git a/python/ray/experimental/sgd/param_server.py b/python/ray/experimental/sgd/param_server.py new file mode 100644 index 0000000000000..517d419c36440 --- /dev/null +++ b/python/ray/experimental/sgd/param_server.py @@ -0,0 +1,82 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import logging + +import numpy as np + +import ray +from ray.experimental.sgd.util import Timeline, fetch, warmup + +logger = logging.getLogger(__name__) + + +@ray.remote(num_cpus=0) +class ParameterServer(object): + """Helper class for ray.experimental.sgd.DistributedSGD.""" + + def __init__(self, num_workers, tid): + self.num_sgd_workers = num_workers + self.acc_counter = 0 + self.timeline = Timeline(tid) + # TODO(ekl) get this to work again so we get ray events + # self.timeline.patch_ray() + + def initialize(self, shard_shape): + """Resets the gradient buffer to zeros.""" + self.accumulated = np.zeros(shard_shape, dtype=np.float32) + + def prefetch(self, oids): + """Tell plasma to prefetch the given object ids over the network.""" + self.timeline.reset() + self.timeline.start("prefetch") + fetch(oids) + self.timeline.end("prefetch") + + def add_spinwait(self, grad_shard_ids): + """Optimized version of add() that operates on multiple grads.""" + self.timeline.start("add_spinwait") + plasma_ids = [ray.pyarrow.plasma.ObjectID(x) for x in grad_shard_ids] + while plasma_ids: + for p in plasma_ids: + if ray.worker.global_worker.plasma_client.contains(p): + self.timeline.start("get_buffers") + grads = ray.worker.global_worker.plasma_client.get(p) + self.accumulated += grads + self.acc_counter += 1 + self.timeline.end("get_buffers") + plasma_ids.remove(p) + break + self.timeline.end("add_spinwait") + + def add(self, grad_shard_id): + """Add the given gradient value to the accumulated gradients.""" + self.timeline.start("add") + self.timeline.start("get_buffers") + oid = ray.pyarrow.plasma.ObjectID(grad_shard_id) + grads = ray.worker.global_worker.plasma_client.get(oid) + self.timeline.end("get_buffers") + self.accumulated += grads + self.acc_counter += 1 + self.timeline.end("add") + + def get(self, object_id): + """Put the accumulated gradients to the given object id.""" + self.timeline.start("get") + client = ray.worker.global_worker.plasma_client + assert self.acc_counter == self.num_sgd_workers, self.acc_counter + oid = ray.pyarrow.plasma.ObjectID(object_id) + client.put(self.accumulated.flatten(), object_id=oid) + self.accumulated = np.zeros_like(self.accumulated) + self.acc_counter = 0 + self.timeline.end("get") + + 
def get_timeline(self): + return self.timeline + + def ip(self): + return ray.services.get_node_ip_address() + + def warmup(self): + warmup() diff --git a/python/ray/experimental/sgd/sgd.py b/python/ray/experimental/sgd/sgd.py index c569c036f1b10..a663960683f79 100644 --- a/python/ray/experimental/sgd/sgd.py +++ b/python/ray/experimental/sgd/sgd.py @@ -7,338 +7,187 @@ import time import numpy as np -import pyarrow.plasma as plasma -import tensorflow as tf import ray -from ray.experimental.sgd.util import Timeline, fetch, run_timeline -from ray.experimental.sgd.modified_allreduce import sum_gradients_all_reduce, \ - unpack_small_tensors +from ray.experimental.sgd.sgd_worker import SGDWorker +from ray.experimental.sgd.param_server import ParameterServer logger = logging.getLogger(__name__) -class SGDWorker(object): +class DistributedSGD(object): + """Experimental distributed SGD implementation in Ray. + + This supports two modes: + 'simple': centralized gradient aggregation + 'ps': sharded parameter-server implementation + + To use this class, you'll have to implement model.py:Model. + + Arguments: + model_creator (func): Function that returns a model given worker and + device indexes as arguments. Each model replica will be created + within its own variable scope. + num_workers (int): Number of Ray actors to use for SGD. + devices_per_worker (int): Number of GPU or CPU devices to use per + worker. One model replica will be created per device. + gpu (bool): Whether to use GPU devices. + strategy (str): Strategy to use for distributed gradient aggregation. + This only applies if num_workers > 1. + grad_shard_bytes (int): Fuse gradient tensors into chunks of at most + this size (if applicable). + all_reduce_alg (str): TensorFlow strategy to use for gradient + synchronization within the same worker (if applicable). + See modified_allreduce.py for options. + + Examples: + >>> # Setup distributed SGD + >>> model_creator = ( + ... lambda worker_idx, device_idx: YourModelClass(...)) + >>> sgd = DistributedSGD( + ... model_creator, num_workers=2, + ... devices_per_worker=4, gpu=True, strategy="ps") + + >>> # To train + >>> for i in range(100): + ... stats = sgd.step(fetch_stats=i % 10 == 0) + + >>> # To access or update model state + >>> sgd.foreach_model(lambda model: ...) + + >>> # To access or update worker state + >>> sgd.foreach_worker(lambda worker: ...) 
+ """ + def __init__(self, - worker_index, model_creator, - all_reduce_alg="simple", - num_devices=1, - use_cpus=False, - max_bytes=60000000, - plasma_op=False): - self.worker_index = worker_index - assert num_devices > 0 - - # TODO(ekl) support custom session - tf_session_args = { - "device_count": { - "CPU": num_devices - }, - "log_device_placement": False, - "gpu_options": tf.GPUOptions(force_gpu_compatible=True), - "inter_op_parallelism_threads": 128, - } - config_proto = tf.ConfigProto(**tf_session_args) - self.sess = tf.Session(config=config_proto) - self.models = [] - grad_ops = [] - - if use_cpus: - device_tmpl = "/cpu:%d" + num_workers, + devices_per_worker, + gpu=True, + strategy="ps", + grad_shard_bytes=10000000, + all_reduce_alg="simple"): + + if num_workers == 1 and strategy == "ps": + logger.warn( + "The parameter server strategy does not make sense for single " + "worker operation, falling back to simple mode.") + strategy = "simple" + + if strategy == "ps": + use_plasma_op = True + elif strategy == "simple": + use_plasma_op = False + grad_shard_bytes = 0 # tensor fusion doesn't make sense else: - device_tmpl = "/gpu:%d" - for device_idx in range(num_devices): - device = device_tmpl % device_idx - with tf.device(device): - with tf.variable_scope("device_%d" % device_idx): - model = model_creator(worker_index, device_idx) - self.models.append(model) - model.grads = [ - t - for t in model.optimizer.compute_gradients(model.loss) - if t[0] is not None - ] - grad_ops.append(model.grads) - - if num_devices == 1: - assert not max_bytes, "Not supported with 1 GPU" - self.packed_grads_and_vars = grad_ops + raise ValueError("strategy must be one of 'ps', 'simple'") + self.strategy = strategy + + self.model_creator = model_creator + if gpu: + requests = {"num_gpus": devices_per_worker} else: - if max_bytes: - self.packed_grads_and_vars, packing_vals = ( - sum_gradients_all_reduce( - "", - grad_ops, - 1, - all_reduce_alg, - 1, - list(range(num_devices)), - agg_small_grads_max_bytes=max_bytes)) - else: - self.packed_grads_and_vars, _ = (sum_gradients_all_reduce( - "", - grad_ops, - 1, - all_reduce_alg, - 1, - list(range(num_devices)), - agg_small_grads_max_bytes=0)) - self.per_device_grads = [ - list(zip(*dev_gv))[0] for dev_gv in self.packed_grads_and_vars - ] - assert (len(self.per_device_grads) == num_devices) - self.num_grads = num_grads = len(self.packed_grads_and_vars[0]) - if max_bytes: - logger.info("Packed grads => {} tensors".format(num_grads)) - - # Ops for reading grads with the right control deps - nccl_noops = [] - for j in range(num_grads)[::-1]: - deps = nccl_noops + [ - dev_grad[j] for dev_grad in self.per_device_grads - ] - with tf.control_dependencies(deps): - nccl_noops = [tf.no_op()] - - # You must fetch this otherwise the NCCL allreduce will hang - self.nccl_control_out = tf.group(*nccl_noops) - - round_robin_devices = False - if plasma_op: - store_socket = ( - ray.worker.global_worker.plasma_client.store_socket_name) - manager_socket = ( - ray.worker.global_worker.plasma_client.manager_socket_name) - if not plasma.tf_plasma_op: - plasma.build_plasma_tensorflow_op() - - # For fetching grads -> plasma - self.plasma_in_grads = [] - self.plasma_in_grads_oids = [ - tf.placeholder(shape=[], dtype=tf.string, name="in_grad_oids") - for _ in range(num_grads) - ] - ix = 0 - for j in range(num_grads): - grad = self.per_device_grads[ix][j] - if round_robin_devices: - ix += 1 # round robin assignment - ix %= num_devices - with tf.device(self.models[ix].loss.device): - 
plasma_grad = plasma.tf_plasma_op.tensor_to_plasma( - [grad], - self.plasma_in_grads_oids[j], - plasma_store_socket_name=store_socket, - plasma_manager_socket_name=manager_socket) - self.plasma_in_grads.append(plasma_grad) - - # For applying grads <- plasma - unpacked_gv = [] - self.plasma_out_grads_oids = [ - tf.placeholder( - shape=[], dtype=tf.string, name="grad_out_oids") - for _ in range(num_grads) + requests = {"num_cpus": devices_per_worker} + + RemoteSGDWorker = ray.remote(**requests)(SGDWorker) + self.workers = [] + logger.info( + "Creating SGD workers ({} total, {} devices per worker)".format( + num_workers, devices_per_worker)) + for worker_index in range(num_workers): + self.workers.append( + RemoteSGDWorker.remote( + worker_index, + model_creator, + num_devices=devices_per_worker, + plasma_op=use_plasma_op, + gpu=gpu, + max_bytes=grad_shard_bytes, + all_reduce_alg=all_reduce_alg)) + + logger.info("Waiting for gradient configuration") + shard_shapes = ray.get(self.workers[0].shard_shapes.remote()) + + logger.info("Waiting for actors to start") + ray.get([w.shard_shapes.remote() for w in self.workers]) + + if strategy == "ps": + logger.info("Starting parameter servers ({} shards)".format( + len(shard_shapes))) + self.ps_list = [ + ParameterServer.remote(len(self.workers), i) + for i, s in enumerate(shard_shapes) ] - packed_plasma_grads = [] - ix = 0 - for j in range(num_grads): - with tf.device(self.plasma_in_grads[j].device): - with tf.control_dependencies([self.plasma_in_grads[j]]): - grad_ph = plasma.tf_plasma_op.plasma_to_tensor( - self.plasma_out_grads_oids[j], - dtype=tf.float32, - plasma_store_socket_name=store_socket, - plasma_manager_socket_name=manager_socket) - grad_ph = tf.reshape(grad_ph, - self.packed_grads_and_vars[0][j][0].shape) - logger.debug("Packed tensor {}".format(grad_ph)) - packed_plasma_grads.append(grad_ph) - for i in range(num_devices): - per_device = [] - for j, (g, v) in enumerate(self.packed_grads_and_vars[i]): - grad_ph = packed_plasma_grads[j] - per_device.append((grad_ph, v)) - unpacked_gv.append(per_device) - - if max_bytes: - unpacked_gv = unpack_small_tensors(unpacked_gv, packing_vals) - - elif max_bytes: - unpacked_gv = unpack_small_tensors(self.packed_grads_and_vars, - packing_vals) + ray.get([ + ps.initialize.remote(s) + for ps, s in zip(self.ps_list, shard_shapes) + ]) + logger.info("Parameter servers started") else: - unpacked_gv = self.packed_grads_and_vars - - # Same shape as packed_grads_and_vars - assert len(unpacked_gv) == num_devices - assert len(unpacked_gv[0][0]) == 2 - - apply_ops = [] - to_apply = unpacked_gv[0] - for ix, m in enumerate(self.models): - apply_ops.append( - m.optimizer.apply_gradients( - [(g, v) - for ((g, _), (_, v)) in zip(to_apply, unpacked_gv[ix])])) - self.apply_op = tf.group(*apply_ops) - init_op = tf.group(tf.global_variables_initializer(), - tf.local_variables_initializer()) - self.sess.run(init_op) + self.ps_list = [] + + def foreach_worker(self, fn): + """Apply the given function to each remote worker. + + Returns: + List of results from applying the function. + """ + results = ray.get([w.foreach_worker.remote(fn) for w in self.workers]) + return results def foreach_model(self, fn): - return [fn(m) for m in self.models] + """Apply the given function to each model replica in each worker. - def foreach_worker(self, fn): - return fn(self) - - def compute_gradients(self): - start = time.time() - feed_dict = {} - # Aggregate feed dicts for each model on this worker. 
- for model in self.models: - feed_dict.update(model.get_feed_dict()) - # We only need to fetch the first per_device_grad, since they are - # averaged across all devices by allreduce. - fetches = self.sess.run( - [ - self.models[0].loss, self.per_device_grads[0], - self.nccl_control_out - ], - feed_dict=feed_dict) - logger.debug( - "compute grad interior time {}".format(time.time() - start)) - return fetches - - def apply_gradients(self, avg_grads): - start = time.time() - result = { - g: avg_grads[i] - for (i, g) in enumerate(self.per_device_grads[0]) - } - self.sess.run(self.apply_op, feed_dict=result) - logger.debug("apply grad interior time {}".format(time.time() - start)) - - def ps_compute_apply(self, - out_grad_shard_oids, - agg_grad_shard_oids, - tl_name="ps_compute_apply", - write_timeline=False): - feed_dict = { - ph: oid - for (ph, - oid) in zip(self.plasma_in_grads_oids, out_grad_shard_oids) - } - feed_dict.update({ - ph: oid - for (ph, - oid) in zip(self.plasma_out_grads_oids, agg_grad_shard_oids) - }) - fetch(agg_grad_shard_oids) - run_timeline( - self.sess, - [self.plasma_in_grads, self.apply_op, self.nccl_control_out], - feed_dict=feed_dict, - write_timeline=write_timeline) - - def num_grad_shards(self): - return self.num_grads - - def shard_shapes(self): - main_gv = self.packed_grads_and_vars[0] - return [g.shape for g, _ in main_gv] - - def ip(self): - return ray.services.get_node_ip_address() - - -class ParameterServer(object): - def __init__(self, num_workers, tid): - self.num_sgd_workers = num_workers - self.acc_counter = 0 - self.timeline = Timeline(tid) - self.timeline.patch_ray() - - def set_tid(self, tid): - self.timeline.tid = tid - - def get_time(self): - return time.time() + self.timeline.offset - - def set_time(self, ref_time): - self.timeline.offset = ref_time - time.time() - - def initialize(self, shard_shape): - self.accumulated = np.zeros(shard_shape, dtype=np.float32) - - def mark(self): - self.timeline.event("mark") - - def prefetch(self, oids): - self.timeline.reset() - self.timeline.start("prefetch") - fetch(oids) - self.timeline.end("prefetch") - - def add_spinwait(self, grad_shard_ids): - self.timeline.start("add_spinwait") - plasma_ids = [ray.pyarrow.plasma.ObjectID(x) for x in grad_shard_ids] - while plasma_ids: - for p in plasma_ids: - if ray.worker.global_worker.plasma_client.contains(p): - self.timeline.start("get_buffers") - grads = ray.worker.global_worker.plasma_client.get(p) - self.accumulated += grads - self.acc_counter += 1 - self.timeline.end("get_buffers") - plasma_ids.remove(p) - break - self.timeline.end("add_spinwait") - - def add(self, grad_shard_id): - self.timeline.start("add") - self.timeline.start("get_buffers") - oid = ray.pyarrow.plasma.ObjectID(grad_shard_id) - grads = ray.worker.global_worker.plasma_client.get(oid) - self.timeline.end("get_buffers") - self.accumulated += grads - self.acc_counter += 1 - self.timeline.end("add") - - def get(self, object_id): - self.timeline.start("get") - client = ray.worker.global_worker.plasma_client - assert self.acc_counter == self.num_sgd_workers, self.acc_counter - oid = ray.pyarrow.plasma.ObjectID(object_id) - client.put(self.accumulate.flatten(), object_id=oid) - self.accumulated = np.zeros_like(self.accumulated) - self.acc_counter = 0 - self.timeline.end("get") - - def get_timeline(self): - return self.timeline - - def ip(self): - return ray.services.get_node_ip_address() - - def pin(self, cpu_id): - try: - import psutil - p = psutil.Process() - p.cpu_affinity([cpu_id]) - 
logger.info("Setting CPU Affinity to: {}".format(cpu_id)) - except Exception as e: - logger.error(e) - - -def average_gradients(grads): + Returns: + List of results from applying the function. + """ + results = ray.get([w.foreach_model.remote(fn) for w in self.workers]) + out = [] + for r in results: + out.extend(r) + return out + + def for_model(self, fn): + """Apply the given function to a single model replica. + + Returns: + Result from applying the function. + """ + return ray.get(self.workers[0].for_model.remote(fn)) + + def step(self, fetch_stats=False): + """Run a single SGD step. + + Arguments: + fetch_stats (bool): Whether to return stats from the step. This can + slow down the computation by acting as a global barrier. + """ + if self.strategy == "ps": + return _distributed_sgd_step( + self.workers, + self.ps_list, + write_timeline=False, + fetch_stats=fetch_stats) + else: + return _simple_sgd_step(self.workers) + + def warmup(self): + logger.info("Warming up object store of worker actors") + ray.get([w.warmup.remote() for w in self.workers]) + logger.info("Warmup complete") + + +def _average_gradients(grads): out = [] for grad_list in zip(*grads): out.append(np.mean(grad_list, axis=0)) return out -def do_sgd_step(actors): +def _simple_sgd_step(actors): + if len(actors) == 1: + return {"loss": ray.get(actors[0].compute_apply.remote())} + start = time.time() fetches = ray.get([a.compute_gradients.remote() for a in actors]) losses = [f[0] for f in fetches] @@ -349,29 +198,33 @@ def do_sgd_step(actors): assert len(grads) == 1 avg_grad = grads[0] else: - avg_grad = average_gradients(grads) + avg_grad = _average_gradients(grads) logger.debug("grad reduce time {}".format(time.time() - start)) start = time.time() ray.get([a.apply_gradients.remote(avg_grad) for a in actors]) logger.debug("apply all grads time {}".format(time.time() - start)) - return np.mean(losses) + return {"loss": np.mean(losses)} -def distributed_sgd_step(actors, ps_list, write_timeline): +def _distributed_sgd_step(actors, ps_list, fetch_stats, write_timeline): # Preallocate object ids that actors will write gradient shards to grad_shard_oids_list = [[np.random.bytes(20) for _ in ps_list] for _ in actors] - logger.info("generated grad oids") + logger.debug("Generated grad oids") # Preallocate object ids that param servers will write new weights to accum_shard_ids = [np.random.bytes(20) for _ in ps_list] - logger.info("generated accum oids") + logger.debug("Generated accum oids") # Kick off the fused compute grad / update weights tf run for each actor + losses = [] for actor, grad_shard_oids in zip(actors, grad_shard_oids_list): - actor.ps_compute_apply.remote( - grad_shard_oids, accum_shard_ids, write_timeline=write_timeline) - logger.info("Launched all ps_compute_applys on all actors") + losses.append( + actor.ps_compute_apply.remote( + grad_shard_oids, + accum_shard_ids, + write_timeline=write_timeline)) + logger.debug("Launched all ps_compute_applys on all actors") # Issue prefetch ops for j, (ps, weight_shard_oid) in list( @@ -381,7 +234,7 @@ def distributed_sgd_step(actors, ps_list, write_timeline): to_fetch.append(grad_shard_oids[j]) random.shuffle(to_fetch) ps.prefetch.remote(to_fetch) - logger.info("Launched all prefetch ops") + logger.debug("Launched all prefetch ops") # Aggregate the gradients produced by the actors. These operations # run concurrently with the actor methods above. 
@@ -390,11 +243,11 @@ def distributed_sgd_step(actors, ps_list, write_timeline): enumerate(zip(ps_list, accum_shard_ids)))[::-1]: ps.add_spinwait.remote([gs[j] for gs in grad_shard_oids_list]) ps_gets.append(ps.get.remote(weight_shard_oid)) - logger.info("Launched all aggregate ops") + logger.debug("Launched all aggregate ops") if write_timeline: timelines = [ps.get_timeline.remote() for ps in ps_list] - logger.info("launched timeline gets") + logger.debug("Launched timeline gets") timelines = ray.get(timelines) t0 = timelines[0] for t in timelines[1:]: @@ -403,44 +256,7 @@ def distributed_sgd_step(actors, ps_list, write_timeline): else: # Wait for at least the ps gets to finish ray.get(ps_gets) - - -class DistributedSGD(object): - def __init__(self, - model_creator, - num_workers, - devices_per_worker, - use_cpus=False, - use_plasma_op=False): - self.model_creator = model_creator - if use_cpus: - requests = {"num_cpus": devices_per_worker} - else: - requests = {"num_gpus": devices_per_worker} - RemoteSGDWorker = ray.remote(**requests)(SGDWorker) - self.workers = [] - for worker_index in range(num_workers): - logger.info("Creating worker {}".format(worker_index)) - self.workers.append( - RemoteSGDWorker.remote( - worker_index, - model_creator, - num_devices=devices_per_worker, - plasma_op=use_plasma_op, - use_cpus=use_cpus)) - assert not use_plasma_op, \ - "TODO: when use_plasma_op is true, we must run in PS mode" - - def foreach_worker(self, fn): - results = ray.get([w.foreach_worker.remote(fn) for w in self.workers]) - return results - - def foreach_model(self, fn): - results = ray.get([w.foreach_model.remote(fn) for w in self.workers]) - out = [] - for r in results: - out.extend(r) - return r - - def step(self): - return do_sgd_step(self.workers) + if fetch_stats: + return {"loss": np.mean(ray.get(losses))} + else: + return None diff --git a/python/ray/experimental/sgd/sgd_worker.py b/python/ray/experimental/sgd/sgd_worker.py new file mode 100644 index 0000000000000..0d4b45c7c8bc4 --- /dev/null +++ b/python/ray/experimental/sgd/sgd_worker.py @@ -0,0 +1,268 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import logging +import time + +import pyarrow.plasma as plasma +import tensorflow as tf + +import ray +from ray.experimental.sgd.util import fetch, run_timeline, warmup +from ray.experimental.sgd.modified_allreduce import sum_gradients_all_reduce, \ + unpack_small_tensors + +logger = logging.getLogger(__name__) + + +class SGDWorker(object): + """Helper class for ray.experimental.sgd.DistributedSGD.""" + + def __init__(self, + worker_index, + model_creator, + all_reduce_alg="simple", + num_devices=1, + gpu=False, + max_bytes=10000000, + plasma_op=False): + self.worker_index = worker_index + assert num_devices > 0 + + # TODO(ekl) support custom session + tf_session_args = { + "device_count": { + "CPU": num_devices + }, + "log_device_placement": False, + "gpu_options": tf.GPUOptions(force_gpu_compatible=True), + "inter_op_parallelism_threads": 128, + } + config_proto = tf.ConfigProto(**tf_session_args) + self.sess = tf.Session(config=config_proto) + self.models = [] + grad_ops = [] + + if gpu: + device_tmpl = "/gpu:%d" + else: + device_tmpl = "/cpu:%d" + with self.sess.as_default(): + for device_idx in range(num_devices): + device = device_tmpl % device_idx + with tf.device(device): + with tf.variable_scope("device_%d" % device_idx): + model = model_creator(worker_index, device_idx) + self.models.append(model) + grads = [ 
+ t for t in model.optimizer.compute_gradients( + model.loss) if t[0] is not None + ] + grad_ops.append(grads) + + if num_devices == 1: + if max_bytes: + raise ValueError( + "Implementation limitation: grad_shard_bytes > 0 " + "({}) currently requires > 1 device".format(max_bytes)) + self.packed_grads_and_vars = grad_ops + else: + if max_bytes: + self.packed_grads_and_vars, packing_vals = ( + sum_gradients_all_reduce( + "", + grad_ops, + 1, + all_reduce_alg, + 1, + list(range(num_devices)), + agg_small_grads_max_bytes=max_bytes)) + else: + self.packed_grads_and_vars, _ = (sum_gradients_all_reduce( + "", + grad_ops, + 1, + all_reduce_alg, + 1, + list(range(num_devices)), + agg_small_grads_max_bytes=0)) + self.per_device_grads = [ + list(zip(*dev_gv))[0] for dev_gv in self.packed_grads_and_vars + ] + assert (len(self.per_device_grads) == num_devices) + self.num_grads = num_grads = len(self.packed_grads_and_vars[0]) + if max_bytes: + logger.info("Packed grads => {} tensors".format(num_grads)) + + # Ops for reading grads with the right control deps + nccl_noops = [] + for j in range(num_grads)[::-1]: + deps = nccl_noops + [ + dev_grad[j] for dev_grad in self.per_device_grads + ] + with tf.control_dependencies(deps): + nccl_noops = [tf.no_op()] + + # You must fetch this otherwise the NCCL allreduce will hang + self.nccl_control_out = tf.group(*nccl_noops) + + if plasma_op: + store_socket = ( + ray.worker.global_worker.plasma_client.store_socket_name) + manager_socket = ( + ray.worker.global_worker.plasma_client.manager_socket_name) + if not plasma.tf_plasma_op: + plasma.build_plasma_tensorflow_op() + + # For fetching grads -> plasma + self.plasma_in_grads = [] + self.plasma_in_grads_oids = [ + tf.placeholder(shape=[], dtype=tf.string, name="in_grad_oids") + for _ in range(num_grads) + ] + for j in range(num_grads): + grad = self.per_device_grads[0][j] + with tf.device(self.models[0].loss.device): + plasma_grad = plasma.tf_plasma_op.tensor_to_plasma( + [grad], + self.plasma_in_grads_oids[j], + plasma_store_socket_name=store_socket, + plasma_manager_socket_name=manager_socket) + self.plasma_in_grads.append(plasma_grad) + + # For applying grads <- plasma + unpacked_gv = [] + self.plasma_out_grads_oids = [ + tf.placeholder( + shape=[], dtype=tf.string, name="grad_out_oids") + for _ in range(num_grads) + ] + packed_plasma_grads = [] + for j in range(num_grads): + with tf.device(self.plasma_in_grads[j].device): + with tf.control_dependencies([self.plasma_in_grads[j]]): + grad_ph = plasma.tf_plasma_op.plasma_to_tensor( + self.plasma_out_grads_oids[j], + dtype=tf.float32, + plasma_store_socket_name=store_socket, + plasma_manager_socket_name=manager_socket) + grad_ph = tf.reshape(grad_ph, + self.packed_grads_and_vars[0][j][0].shape) + logger.debug("Packed tensor {}".format(grad_ph)) + packed_plasma_grads.append(grad_ph) + for i in range(num_devices): + per_device = [] + for j, (g, v) in enumerate(self.packed_grads_and_vars[i]): + grad_ph = packed_plasma_grads[j] + per_device.append((grad_ph, v)) + unpacked_gv.append(per_device) + + if max_bytes: + unpacked_gv = unpack_small_tensors(unpacked_gv, packing_vals) + + elif max_bytes: + unpacked_gv = unpack_small_tensors(self.packed_grads_and_vars, + packing_vals) + else: + unpacked_gv = self.packed_grads_and_vars + + # Same shape as packed_grads_and_vars + assert len(unpacked_gv) == num_devices + assert len(unpacked_gv[0][0]) == 2 + + apply_ops = [] + to_apply = unpacked_gv[0] + for ix, m in enumerate(self.models): + apply_ops.append( + 
m.optimizer.apply_gradients( + [(g, v) + for ((g, _), (_, v)) in zip(to_apply, unpacked_gv[ix])])) + self.apply_op = tf.group(*apply_ops) + init_op = tf.group(tf.global_variables_initializer(), + tf.local_variables_initializer()) + self.sess.run(init_op) + + def _grad_feed_dict(self): + # Aggregate feed dicts for each model on this worker. + feed_dict = {} + for model in self.models: + feed_dict.update(model.get_feed_dict()) + return feed_dict + + def foreach_model(self, fn): + with self.sess.as_default(): + return [fn(m) for m in self.models] + + def foreach_worker(self, fn): + with self.sess.as_default(): + return fn(self) + + def for_model(self, fn): + with self.sess.as_default(): + return fn(self.models[0]) + + def compute_gradients(self): + start = time.time() + feed_dict = self._grad_feed_dict() + # We only need to fetch the first per_device_grad, since they are + # averaged across all devices by allreduce. + fetches = self.sess.run( + [ + self.models[0].loss, self.per_device_grads[0], + self.nccl_control_out + ], + feed_dict=feed_dict) + logger.debug( + "Compute grad interior time {}".format(time.time() - start)) + return fetches + + def apply_gradients(self, avg_grads): + start = time.time() + result = { + g: avg_grads[i] + for (i, g) in enumerate(self.per_device_grads[0]) + } + self.sess.run(self.apply_op, feed_dict=result) + logger.debug("Apply grad interior time {}".format(time.time() - start)) + + def compute_apply(self): + fetches = run_timeline( + self.sess, + [self.models[0].loss, self.apply_op, self.nccl_control_out], + feed_dict=self._grad_feed_dict(), + name="compute_apply") + return fetches[0] + + def ps_compute_apply(self, + out_grad_shard_oids, + agg_grad_shard_oids, + tl_name="ps_compute_apply", + write_timeline=False): + feed_dict = self._grad_feed_dict() + feed_dict.update( + dict(zip(self.plasma_in_grads_oids, out_grad_shard_oids))) + feed_dict.update( + dict(zip(self.plasma_out_grads_oids, agg_grad_shard_oids))) + fetch(agg_grad_shard_oids) + fetches = run_timeline( + self.sess, [ + self.models[0].loss, self.plasma_in_grads, self.apply_op, + self.nccl_control_out + ], + feed_dict=feed_dict, + write_timeline=write_timeline) + return fetches[0] + + def num_grad_shards(self): + return self.num_grads + + def shard_shapes(self): + main_gv = self.packed_grads_and_vars[0] + return [g.shape for g, _ in main_gv] + + def ip(self): + return ray.services.get_node_ip_address() + + def warmup(self): + warmup() diff --git a/python/ray/experimental/sgd/test_sgd.py b/python/ray/experimental/sgd/test_sgd.py index d6369a4e00011..79e00b2656ba7 100755 --- a/python/ray/experimental/sgd/test_sgd.py +++ b/python/ray/experimental/sgd/test_sgd.py @@ -1,32 +1,67 @@ +#!/usr/bin/env python + from __future__ import absolute_import from __future__ import division from __future__ import print_function import argparse +import time import ray from ray.experimental.sgd.tfbench.test_model import TFBenchModel from ray.experimental.sgd.sgd import DistributedSGD parser = argparse.ArgumentParser() +parser.add_argument("--redis-address", default=None, type=str) +parser.add_argument("--num-iters", default=10, type=int) +parser.add_argument("--batch-size", default=1, type=int) +parser.add_argument("--num-workers", default=2, type=int) +parser.add_argument("--grad-shard-bytes", default=10000000, type=int) +parser.add_argument("--devices-per-worker", default=2, type=int) +parser.add_argument("--stats-interval", default=10, type=int) +parser.add_argument("--all-reduce-alg", default="simple", type=str) 
+parser.add_argument("--object-store-memory", default=None, type=int) +parser.add_argument( + "--warmup", action="store_true", help="Warm up object store before start.") parser.add_argument( - "--num-iters", default=100, type=int, help="Number of iterations to run") + "--strategy", default="ps", type=str, help="One of 'simple' or 'ps'") +parser.add_argument( + "--gpu", action="store_true", help="Use GPUs for optimization") if __name__ == "__main__": - ray.init() - args, _ = parser.parse_known_args() + ray.init( + redis_address=args.redis_address, + object_store_memory=args.object_store_memory) model_creator = ( - lambda worker_idx, device_idx: TFBenchModel(batch=1, use_cpus=True)) + lambda worker_idx, device_idx: TFBenchModel( + batch=args.batch_size, use_cpus=not args.gpu)) sgd = DistributedSGD( model_creator, - num_workers=2, - devices_per_worker=2, - use_cpus=True, - use_plasma_op=False) - - for _ in range(args.num_iters): - loss = sgd.step() - print("Current loss", loss) + num_workers=args.num_workers, + devices_per_worker=args.devices_per_worker, + gpu=args.gpu, + strategy=args.strategy, + grad_shard_bytes=args.grad_shard_bytes, + all_reduce_alg=args.all_reduce_alg) + + if args.warmup: + sgd.warmup() + + t = [] + + for i in range(args.num_iters): + start = time.time() + fetch_stats = i % args.stats_interval == 0 + print("== Step {} ==".format(i)) + stats = sgd.step(fetch_stats=fetch_stats) + ips = ((args.batch_size * args.num_workers * args.devices_per_worker) / + (time.time() - start)) + print("Iteration time", time.time() - start, "Images per second", ips) + t.append(ips) + if fetch_stats: + print("Current loss", stats) + + print("Peak throughput", max(sum(t[i:i + 5]) / 5 for i in range(len(t)))) diff --git a/python/ray/experimental/sgd/tfbench/test_model.py b/python/ray/experimental/sgd/tfbench/test_model.py index 0dd48607ef0a6..d866668f810d5 100644 --- a/python/ray/experimental/sgd/tfbench/test_model.py +++ b/python/ray/experimental/sgd/tfbench/test_model.py @@ -5,13 +5,14 @@ import tensorflow as tf from tfbench import model_config +from ray.experimental.sgd.model import Model class MockDataset(): name = "synthetic" -class TFBenchModel(object): +class TFBenchModel(Model): def __init__(self, batch=64, use_cpus=False): image_shape = [batch, 224, 224, 3] labels_shape = [batch] @@ -25,20 +26,22 @@ def __init__(self, batch=64, use_cpus=False): name='synthetic_images') # Minor hack to avoid H2D copy when using synthetic data - self.inputs = tf.contrib.framework.local_variable( + inputs = tf.contrib.framework.local_variable( images, name='gpu_cached_images') - self.labels = tf.random_uniform( + labels = tf.random_uniform( labels_shape, minval=0, maxval=999, dtype=tf.int32, name='synthetic_labels') - self.model = model_config.get_model_config("resnet101", MockDataset()) - logits, aux = self.model.build_network( - self.inputs, data_format=use_cpus and "NHWC" or "NCHW") + model = model_config.get_model_config("resnet101", MockDataset()) + logits, aux = model.build_network( + inputs, data_format=use_cpus and "NHWC" or "NCHW") loss = tf.nn.sparse_softmax_cross_entropy_with_logits( - logits=logits, labels=self.labels) + logits=logits, labels=labels) + + # Implement model interface self.loss = tf.reduce_mean(loss, name='xentropy-loss') self.optimizer = tf.train.GradientDescentOptimizer(1e-6) diff --git a/python/ray/experimental/sgd/util.py b/python/ray/experimental/sgd/util.py index ca72bb5e9ef43..c8df01cb35b25 100644 --- a/python/ray/experimental/sgd/util.py +++ 
b/python/ray/experimental/sgd/util.py @@ -4,6 +4,7 @@ import json import logging +import numpy as np import os import time import tensorflow as tf @@ -13,16 +14,29 @@ logger = logging.getLogger(__name__) +def warmup(): + logger.info("Warming up object store") + zeros = np.zeros(int(100e6 / 8), dtype=np.float64) + start = time.time() + for _ in range(10): + ray.put(zeros) + logger.info("Initial latency for 100MB put {}".format( + (time.time() - start) / 10)) + for _ in range(5): + for _ in range(100): + ray.put(zeros) + start = time.time() + for _ in range(10): + ray.put(zeros) + logger.info("Warmed up latency for 100MB put {}".format( + (time.time() - start) / 10)) + + def fetch(oids): - if ray.global_state.use_raylet: - local_sched_client = ray.worker.global_worker.local_scheduler_client - for o in oids: - ray_obj_id = ray.ObjectID(o) - local_sched_client.reconstruct_objects([ray_obj_id], True) - else: - for o in oids: - plasma_id = ray.pyarrow.plasma.ObjectID(o) - ray.worker.global_worker.plasma_client.fetch([plasma_id]) + local_sched_client = ray.worker.global_worker.local_scheduler_client + for o in oids: + ray_obj_id = ray.ObjectID(o) + local_sched_client.fetch_or_reconstruct([ray_obj_id], True) def run_timeline(sess, ops, feed_dict=None, write_timeline=False, name=""): diff --git a/python/ray/experimental/state.py b/python/ray/experimental/state.py index d91165637b609..d97cc274f76d6 100644 --- a/python/ray/experimental/state.py +++ b/python/ray/experimental/state.py @@ -2,12 +2,8 @@ from __future__ import division from __future__ import print_function -import copy from collections import defaultdict -import heapq import json -import numbers -import os import redis import sys import time @@ -18,25 +14,6 @@ from ray.utils import (decode, binary_to_object_id, binary_to_hex, hex_to_binary) -# This mapping from integer to task state string must be kept up-to-date with -# the scheduling_state enum in task.h. -TASK_STATUS_WAITING = 1 -TASK_STATUS_SCHEDULED = 2 -TASK_STATUS_QUEUED = 4 -TASK_STATUS_RUNNING = 8 -TASK_STATUS_DONE = 16 -TASK_STATUS_LOST = 32 -TASK_STATUS_RECONSTRUCTING = 64 -TASK_STATUS_MAPPING = { - TASK_STATUS_WAITING: "WAITING", - TASK_STATUS_SCHEDULED: "SCHEDULED", - TASK_STATUS_QUEUED: "QUEUED", - TASK_STATUS_RUNNING: "RUNNING", - TASK_STATUS_DONE: "DONE", - TASK_STATUS_LOST: "LOST", - TASK_STATUS_RECONSTRUCTING: "RECONSTRUCTING", -} - class GlobalState(object): """A class used to interface with the Ray control state. @@ -47,7 +24,6 @@ class GlobalState(object): Attributes: redis_client: The Redis client used to query the primary redis server. redis_clients: Redis clients for each of the Redis shards. - use_raylet: True if we are using the raylet code path. """ def __init__(self): @@ -57,8 +33,6 @@ def __init__(self): self.redis_client = None # Clients for the redis shards, storing the object table & task table. self.redis_clients = None - # True if we are using the raylet code path and false otherwise. - self.use_raylet = None def _check_connected(self): """Check that the object has been initialized before it is used. @@ -78,6 +52,7 @@ def _check_connected(self): def _initialize_global_state(self, redis_ip_address, redis_port, + redis_password=None, timeout=20): """Initialize the GlobalState object by connecting to Redis. @@ -89,9 +64,10 @@ def _initialize_global_state(self, redis_ip_address: The IP address of the node that the Redis server lives on. redis_port: The port that the Redis server is listening on. + redis_password: The password of the redis server. 
""" self.redis_client = redis.StrictRedis( - host=redis_ip_address, port=redis_port) + host=redis_ip_address, port=redis_port, password=redis_password) start_time = time.time() @@ -128,22 +104,15 @@ def _initialize_global_state(self, "ip_address_ports = {}".format( num_redis_shards, ip_address_ports)) - use_raylet = self.redis_client.get("UseRaylet") - if use_raylet is not None: - self.use_raylet = int(use_raylet) == 1 - elif os.environ.get("RAY_USE_XRAY") == "1": - # This environment variable is used in our testing setup. - print("Detected environment variable 'RAY_USE_XRAY'.") - self.use_raylet = True - else: - self.use_raylet = False - # Get the rest of the information. self.redis_clients = [] for ip_address_port in ip_address_ports: shard_address, shard_port = ip_address_port.split(b":") self.redis_clients.append( - redis.StrictRedis(host=shard_address, port=shard_port)) + redis.StrictRedis( + host=shard_address, + port=shard_port, + password=redis_password)) def _execute_command(self, key, *args): """Execute a Redis command on the appropriate Redis shard based on key. @@ -188,53 +157,29 @@ def _object_table(self, object_id): object_id = ray.ObjectID(hex_to_binary(object_id)) # Return information about a single object ID. - if not self.use_raylet: - # Use the non-raylet code path. - object_locations = self._execute_command( - object_id, "RAY.OBJECT_TABLE_LOOKUP", object_id.id()) - if object_locations is not None: - manager_ids = [ - binary_to_hex(manager_id) - for manager_id in object_locations - ] - else: - manager_ids = None - - result_table_response = self._execute_command( - object_id, "RAY.RESULT_TABLE_LOOKUP", object_id.id()) - result_table_message = ( - ray.gcs_utils.ResultTableReply.GetRootAsResultTableReply( - result_table_response, 0)) - - result = { - "ManagerIDs": manager_ids, - "TaskID": binary_to_hex(result_table_message.TaskId()), - "IsPut": bool(result_table_message.IsPut()), - "DataSize": result_table_message.DataSize(), - "Hash": binary_to_hex(result_table_message.Hash()) - } + message = self._execute_command(object_id, "RAY.TABLE_LOOKUP", + ray.gcs_utils.TablePrefix.OBJECT, "", + object_id.id()) + gcs_entry = ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( + message, 0) - else: - # Use the raylet code path. - message = self._execute_command(object_id, "RAY.TABLE_LOOKUP", - ray.gcs_utils.TablePrefix.OBJECT, - "", object_id.id()) - result = [] - gcs_entry = ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( - message, 0) - - for i in range(gcs_entry.EntriesLength()): - entry = ray.gcs_utils.ObjectTableData.GetRootAsObjectTableData( - gcs_entry.Entries(i), 0) - object_info = { - "DataSize": entry.ObjectSize(), - "Manager": entry.Manager(), - "IsEviction": entry.IsEviction(), - "NumEvictions": entry.NumEvictions() - } - result.append(object_info) + assert gcs_entry.EntriesLength() > 0 - return result + entry = ray.gcs_utils.ObjectTableData.GetRootAsObjectTableData( + gcs_entry.Entries(0), 0) + + object_info = { + "DataSize": entry.ObjectSize(), + "Manager": entry.Manager(), + "IsEviction": [entry.IsEviction()], + } + + for i in range(1, gcs_entry.EntriesLength()): + entry = ray.gcs_utils.ObjectTableData.GetRootAsObjectTableData( + gcs_entry.Entries(i), 0) + object_info["IsEviction"].append(entry.IsEviction()) + + return object_info def object_table(self, object_id=None): """Fetch and parse the object table info for one or more object IDs. 
@@ -252,25 +197,12 @@ def object_table(self, object_id=None): return self._object_table(object_id) else: # Return the entire object table. - if not self.use_raylet: - object_info_keys = self._keys( - ray.gcs_utils.OBJECT_INFO_PREFIX + "*") - object_location_keys = self._keys( - ray.gcs_utils.OBJECT_LOCATION_PREFIX + "*") - object_ids_binary = set([ - key[len(ray.gcs_utils.OBJECT_INFO_PREFIX):] - for key in object_info_keys - ] + [ - key[len(ray.gcs_utils.OBJECT_LOCATION_PREFIX):] - for key in object_location_keys - ]) - else: - object_keys = self._keys( - ray.gcs_utils.TablePrefix_OBJECT_string + "*") - object_ids_binary = { - key[len(ray.gcs_utils.TablePrefix_OBJECT_string):] - for key in object_keys - } + object_keys = self._keys(ray.gcs_utils.TablePrefix_OBJECT_string + + "*") + object_ids_binary = { + key[len(ray.gcs_utils.TablePrefix_OBJECT_string):] + for key in object_keys + } results = {} for object_id_binary in object_ids_binary: @@ -287,112 +219,49 @@ def _task_table(self, task_id): Returns: A dictionary with information about the task ID in question. - TASK_STATUS_MAPPING should be used to parse the "State" field - into a human-readable string. """ - if not self.use_raylet: - # Use the non-raylet code path. - task_table_response = self._execute_command( - task_id, "RAY.TASK_TABLE_GET", task_id.id()) - if task_table_response is None: - raise Exception("There is no entry for task ID {} in the task " - "table.".format(binary_to_hex(task_id.id()))) - task_table_message = ray.gcs_utils.TaskReply.GetRootAsTaskReply( - task_table_response, 0) - task_spec = task_table_message.TaskSpec() - task_spec = ray.local_scheduler.task_from_string(task_spec) - - task_spec_info = { - "DriverID": binary_to_hex(task_spec.driver_id().id()), - "TaskID": binary_to_hex(task_spec.task_id().id()), - "ParentTaskID": binary_to_hex(task_spec.parent_task_id().id()), - "ParentCounter": task_spec.parent_counter(), - "ActorID": binary_to_hex(task_spec.actor_id().id()), - "ActorCreationID": binary_to_hex( - task_spec.actor_creation_id().id()), - "ActorCreationDummyObjectID": binary_to_hex( - task_spec.actor_creation_dummy_object_id().id()), - "ActorCounter": task_spec.actor_counter(), - "FunctionID": binary_to_hex(task_spec.function_id().id()), - "Args": task_spec.arguments(), - "ReturnObjectIDs": task_spec.returns(), - "RequiredResources": task_spec.required_resources() - } - - execution_dependencies_message = ( - ray.gcs_utils.TaskExecutionDependencies. - GetRootAsTaskExecutionDependencies( - task_table_message.ExecutionDependencies(), 0)) - execution_dependencies = [ - ray.ObjectID( - execution_dependencies_message.ExecutionDependencies(i)) - for i in range(execution_dependencies_message. - ExecutionDependenciesLength()) - ] - - # TODO(rkn): The return fields ExecutionDependenciesString and - # ExecutionDependencies are redundant, so we should remove - # ExecutionDependencies. However, it is currently used in - # monitor.py. - - return { - "State": task_table_message.State(), - "LocalSchedulerID": binary_to_hex( - task_table_message.LocalSchedulerId()), - "ExecutionDependenciesString": task_table_message. - ExecutionDependencies(), - "ExecutionDependencies": execution_dependencies, - "SpillbackCount": task_table_message.SpillbackCount(), - "TaskSpec": task_spec_info - } - - else: - # Use the raylet code path. 
- message = self._execute_command( - task_id, "RAY.TABLE_LOOKUP", - ray.gcs_utils.TablePrefix.RAYLET_TASK, "", task_id.id()) - gcs_entries = ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( - message, 0) - - info = [] - for i in range(gcs_entries.EntriesLength()): - task_table_message = ray.gcs_utils.Task.GetRootAsTask( - gcs_entries.Entries(i), 0) - - execution_spec = task_table_message.TaskExecutionSpec() - task_spec = task_table_message.TaskSpecification() - task_spec = ray.local_scheduler.task_from_string(task_spec) - task_spec_info = { - "DriverID": binary_to_hex(task_spec.driver_id().id()), - "TaskID": binary_to_hex(task_spec.task_id().id()), - "ParentTaskID": binary_to_hex( - task_spec.parent_task_id().id()), - "ParentCounter": task_spec.parent_counter(), - "ActorID": binary_to_hex(task_spec.actor_id().id()), - "ActorCreationID": binary_to_hex( - task_spec.actor_creation_id().id()), - "ActorCreationDummyObjectID": binary_to_hex( - task_spec.actor_creation_dummy_object_id().id()), - "ActorCounter": task_spec.actor_counter(), - "FunctionID": binary_to_hex(task_spec.function_id().id()), - "Args": task_spec.arguments(), - "ReturnObjectIDs": task_spec.returns(), - "RequiredResources": task_spec.required_resources() - } + message = self._execute_command(task_id, "RAY.TABLE_LOOKUP", + ray.gcs_utils.TablePrefix.RAYLET_TASK, + "", task_id.id()) + gcs_entries = ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( + message, 0) - info.append({ - "ExecutionSpec": { - "Dependencies": [ - execution_spec.Dependencies(i) - for i in range(execution_spec.DependenciesLength()) - ], - "LastTimestamp": execution_spec.LastTimestamp(), - "NumForwards": execution_spec.NumForwards() - }, - "TaskSpec": task_spec_info - }) + assert gcs_entries.EntriesLength() == 1 + + task_table_message = ray.gcs_utils.Task.GetRootAsTask( + gcs_entries.Entries(0), 0) + + execution_spec = task_table_message.TaskExecutionSpec() + task_spec = task_table_message.TaskSpecification() + task_spec = ray.raylet.task_from_string(task_spec) + task_spec_info = { + "DriverID": binary_to_hex(task_spec.driver_id().id()), + "TaskID": binary_to_hex(task_spec.task_id().id()), + "ParentTaskID": binary_to_hex(task_spec.parent_task_id().id()), + "ParentCounter": task_spec.parent_counter(), + "ActorID": binary_to_hex(task_spec.actor_id().id()), + "ActorCreationID": binary_to_hex( + task_spec.actor_creation_id().id()), + "ActorCreationDummyObjectID": binary_to_hex( + task_spec.actor_creation_dummy_object_id().id()), + "ActorCounter": task_spec.actor_counter(), + "FunctionID": binary_to_hex(task_spec.function_id().id()), + "Args": task_spec.arguments(), + "ReturnObjectIDs": task_spec.returns(), + "RequiredResources": task_spec.required_resources() + } - return info + return { + "ExecutionSpec": { + "Dependencies": [ + execution_spec.Dependencies(i) + for i in range(execution_spec.DependenciesLength()) + ], + "LastTimestamp": execution_spec.LastTimestamp(), + "NumForwards": execution_spec.NumForwards() + }, + "TaskSpec": task_spec_info + } def task_table(self, task_id=None): """Fetch and parse the task table information for one or more task IDs. 
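Usage note for the simplified _task_table above: the raylet path is now the only path, so each lookup comes back as a single dict with "ExecutionSpec" and "TaskSpec" keys (there is no longer a "State" field or TASK_STATUS_MAPPING to decode). A minimal sketch, assuming a connected driver and that at least one task has already run; the field names follow the dict built in _task_table above:

import ray

ray.init()


@ray.remote
def f():
    return 1


ray.get(f.remote())

# Whole table, keyed by hex task ID.
for task_id, entry in ray.global_state.task_table().items():
    spec = entry["TaskSpec"]
    deps = entry["ExecutionSpec"]["Dependencies"]
    print(task_id, spec["FunctionID"], len(deps))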
@@ -409,19 +278,12 @@ def task_table(self, task_id=None): task_id = ray.ObjectID(hex_to_binary(task_id)) return self._task_table(task_id) else: - if not self.use_raylet: - task_table_keys = self._keys(ray.gcs_utils.TASK_PREFIX + "*") - task_ids_binary = [ - key[len(ray.gcs_utils.TASK_PREFIX):] - for key in task_table_keys - ] - else: - task_table_keys = self._keys( - ray.gcs_utils.TablePrefix_RAYLET_TASK_string + "*") - task_ids_binary = [ - key[len(ray.gcs_utils.TablePrefix_RAYLET_TASK_string):] - for key in task_table_keys - ] + task_table_keys = self._keys( + ray.gcs_utils.TablePrefix_RAYLET_TASK_string + "*") + task_ids_binary = [ + key[len(ray.gcs_utils.TablePrefix_RAYLET_TASK_string):] + for key in task_table_keys + ] results = {} for task_id_binary in task_ids_binary: @@ -457,95 +319,54 @@ def client_table(self): Information about the Ray clients in the cluster. """ self._check_connected() - if not self.use_raylet: - db_client_keys = self.redis_client.keys( - ray.gcs_utils.DB_CLIENT_PREFIX + "*") - node_info = {} - for key in db_client_keys: - client_info = self.redis_client.hgetall(key) - node_ip_address = decode(client_info[b"node_ip_address"]) - if node_ip_address not in node_info: - node_info[node_ip_address] = [] - client_info_parsed = {} - assert b"client_type" in client_info - assert b"deleted" in client_info - assert b"ray_client_id" in client_info - for field, value in client_info.items(): - if field == b"node_ip_address": - pass - elif field == b"client_type": - client_info_parsed["ClientType"] = decode(value) - elif field == b"deleted": - client_info_parsed["Deleted"] = bool( - int(decode(value))) - elif field == b"ray_client_id": - client_info_parsed["DBClientID"] = binary_to_hex(value) - elif field == b"manager_address": - client_info_parsed["AuxAddress"] = decode(value) - elif field == b"local_scheduler_socket_name": - client_info_parsed["LocalSchedulerSocketName"] = ( - decode(value)) - elif client_info[b"client_type"] == b"local_scheduler": - # The remaining fields are resource types. - client_info_parsed[decode(field)] = float( - decode(value)) - else: - client_info_parsed[decode(field)] = decode(value) - - node_info[node_ip_address].append(client_info_parsed) - - return node_info - else: - # This is the raylet code path. - NIL_CLIENT_ID = ray_constants.ID_SIZE * b"\xff" - message = self.redis_client.execute_command( - "RAY.TABLE_LOOKUP", ray.gcs_utils.TablePrefix.CLIENT, "", - NIL_CLIENT_ID) - - # Handle the case where no clients are returned. This should only - # occur potentially immediately after the cluster is started. - if message is None: - return [] - - node_info = {} - gcs_entry = ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( - message, 0) - - # Since GCS entries are append-only, we override so that - # only the latest entries are kept. - for i in range(gcs_entry.EntriesLength()): - client = ( - ray.gcs_utils.ClientTableData.GetRootAsClientTableData( - gcs_entry.Entries(i), 0)) - - resources = { - decode(client.ResourcesTotalLabel(i)): - client.ResourcesTotalCapacity(i) - for i in range(client.ResourcesTotalLabelLength()) - } - client_id = ray.utils.binary_to_hex(client.ClientId()) - - # If this client is being removed, then it must - # have previously been inserted, and - # it cannot have previously been removed. - if not client.IsInsertion(): - assert client_id in node_info, "Client removed not found!" 
- assert node_info[client_id]["IsInsertion"], ( - "Unexpected duplicate removal of client.") - - node_info[client_id] = { - "ClientID": client_id, - "IsInsertion": client.IsInsertion(), - "NodeManagerAddress": decode(client.NodeManagerAddress()), - "NodeManagerPort": client.NodeManagerPort(), - "ObjectManagerPort": client.ObjectManagerPort(), - "ObjectStoreSocketName": decode( - client.ObjectStoreSocketName()), - "RayletSocketName": decode(client.RayletSocketName()), - "Resources": resources - } - return list(node_info.values()) + NIL_CLIENT_ID = ray_constants.ID_SIZE * b"\xff" + message = self.redis_client.execute_command( + "RAY.TABLE_LOOKUP", ray.gcs_utils.TablePrefix.CLIENT, "", + NIL_CLIENT_ID) + + # Handle the case where no clients are returned. This should only + # occur potentially immediately after the cluster is started. + if message is None: + return [] + + node_info = {} + gcs_entry = ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( + message, 0) + + # Since GCS entries are append-only, we override so that + # only the latest entries are kept. + for i in range(gcs_entry.EntriesLength()): + client = (ray.gcs_utils.ClientTableData.GetRootAsClientTableData( + gcs_entry.Entries(i), 0)) + + resources = { + decode(client.ResourcesTotalLabel(i)): + client.ResourcesTotalCapacity(i) + for i in range(client.ResourcesTotalLabelLength()) + } + client_id = ray.utils.binary_to_hex(client.ClientId()) + + # If this client is being removed, then it must + # have previously been inserted, and + # it cannot have previously been removed. + if not client.IsInsertion(): + assert client_id in node_info, "Client removed not found!" + assert node_info[client_id]["IsInsertion"], ( + "Unexpected duplicate removal of client.") + + node_info[client_id] = { + "ClientID": client_id, + "IsInsertion": client.IsInsertion(), + "NodeManagerAddress": decode(client.NodeManagerAddress()), + "NodeManagerPort": client.NodeManagerPort(), + "ObjectManagerPort": client.ObjectManagerPort(), + "ObjectStoreSocketName": decode( + client.ObjectStoreSocketName()), + "RayletSocketName": decode(client.RayletSocketName()), + "Resources": resources + } + return list(node_info.values()) def log_files(self): """Fetch and return a dictionary of log file names to outputs. @@ -575,129 +396,6 @@ def log_files(self): return ip_filename_file - def task_profiles(self, num_tasks, start=None, end=None, fwd=True): - """Fetch and return a list of task profiles. - - Args: - num_tasks: A limit on the number of tasks that task_profiles will - return. - start: The start point of the time window that is queried for - tasks. - end: The end point in time of the time window that is queried for - tasks. - fwd: If True, means that zrange will be used. If False, zrevrange. - This argument is only meaningful in conjunction with the - num_tasks argument. This controls whether the tasks returned - are the most recent or the least recent. - - Returns: - A tuple of two elements. The first element is a dictionary mapping - the task ID of a task to a list of the profiling information - for all of the executions of that task. The second element is a - list of profiling information for tasks where the events have - no task ID. - """ - task_info = {} - event_log_sets = self.redis_client.keys("event_log*") - - # The heap is used to maintain the set of x tasks that occurred the - # most recently across all of the workers, where x is defined as the - # function parameter num. The key is the start time of the "get_task" - # component of each task. 
Calling heappop will result in the task with - # the earliest "get_task_start" to be removed from the heap. - heap = [] - heapq.heapify(heap) - heap_size = 0 - - # Set up a param dict to pass the redis command - params = {"withscores": True} - if start is not None: - params["min"] = start - elif end is not None: - params["min"] = 0 - - if end is not None: - params["max"] = end - elif start is not None: - params["max"] = time.time() - - if start is None and end is None: - params["end"] = num_tasks - 1 - else: - params["num"] = num_tasks - params["start"] = 0 - - # Parse through event logs to determine task start and end points. - for event_log_set in event_log_sets: - if start is None and end is None: - if fwd: - event_list = self.redis_client.zrange( - event_log_set, **params) - else: - event_list = self.redis_client.zrevrange( - event_log_set, **params) - else: - if fwd: - event_list = self.redis_client.zrangebyscore( - event_log_set, **params) - else: - event_list = self.redis_client.zrevrangebyscore( - event_log_set, **params) - - for (event, score) in event_list: - event_dict = json.loads(decode(event)) - task_id = "" - for event in event_dict: - if "task_id" in event[3]: - task_id = event[3]["task_id"] - task_info[task_id] = {} - task_info[task_id]["score"] = score - # Add task to (min/max) heap by its start point. - # if fwd, we want to delete the largest elements, so -score - heapq.heappush(heap, (-score if fwd else score, task_id)) - heap_size += 1 - - for event in event_dict: - if event[1] == "get_task" and event[2] == 1: - task_info[task_id]["get_task_start"] = event[0] - if event[1] == "get_task" and event[2] == 2: - task_info[task_id]["get_task_end"] = event[0] - if (event[1] == "register_remote_function" - and event[2] == 1): - task_info[task_id]["import_remote_start"] = event[0] - if (event[1] == "register_remote_function" - and event[2] == 2): - task_info[task_id]["import_remote_end"] = event[0] - if (event[1] == "task:deserialize_arguments" - and event[2] == 1): - task_info[task_id]["get_arguments_start"] = event[0] - if (event[1] == "task:deserialize_arguments" - and event[2] == 2): - task_info[task_id]["get_arguments_end"] = event[0] - if event[1] == "task:execute" and event[2] == 1: - task_info[task_id]["execute_start"] = event[0] - if event[1] == "task:execute" and event[2] == 2: - task_info[task_id]["execute_end"] = event[0] - if event[1] == "task:store_outputs" and event[2] == 1: - task_info[task_id]["store_outputs_start"] = event[0] - if event[1] == "task:store_outputs" and event[2] == 2: - task_info[task_id]["store_outputs_end"] = event[0] - if "worker_id" in event[3]: - task_info[task_id]["worker_id"] = event[3]["worker_id"] - if "function_name" in event[3]: - task_info[task_id]["function_name"] = ( - event[3]["function_name"]) - - if heap_size > num_tasks: - min_task, task_id_hex = heapq.heappop(heap) - del task_info[task_id_hex] - heap_size -= 1 - - for key, info in task_info.items(): - self._add_missing_timestamps(info) - - return task_info - def _profile_table(self, component_id): """Get the profile events for a given component. 
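With task_profiles removed here (and dump_catapult_trace removed further down), the supported way to get a timeline is the profile-table based chrome_tracing_dump shown later in this diff. A minimal sketch of the replacement workflow, assuming a connected driver; the output path is arbitrary:

import ray

ray.init()


@ray.remote
def f():
    return 1


ray.get([f.remote() for _ in range(10)])

# Writes Chrome-trace JSON; open chrome://tracing, load the file, and
# enable "Flow events" under View Options.
ray.global_state.chrome_tracing_dump(filename="/tmp/ray_timeline.json")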
@@ -748,10 +446,6 @@ def _profile_table(self, component_id): return profile_events def profile_table(self): - if not self.use_raylet: - raise Exception("This method is only supported in the raylet " - "code path.") - profile_table_keys = self._keys( ray.gcs_utils.TablePrefix_PROFILE_string + "*") component_identifiers_binary = [ @@ -765,24 +459,78 @@ def profile_table(self): for component_id in component_identifiers_binary } - def chrome_tracing_dump(self, - include_task_data=False, - filename=None, - open_browser=False): + def _seconds_to_microseconds(self, time_in_seconds): + """A helper function for converting seconds to microseconds.""" + time_in_microseconds = 10**6 * time_in_seconds + return time_in_microseconds + + # Colors are specified at + # https://github.com/catapult-project/catapult/blob/master/tracing/tracing/base/color_scheme.html. # noqa: E501 + _default_color_mapping = defaultdict( + lambda: "generic_work", { + "worker_idle": "cq_build_abandoned", + "task": "rail_response", + "task:deserialize_arguments": "rail_load", + "task:execute": "rail_animation", + "task:store_outputs": "rail_idle", + "wait_for_function": "detailed_memory_dump", + "ray.get": "good", + "ray.put": "terrible", + "ray.wait": "vsync_highlight_color", + "submit_task": "background_memory_dump", + "fetch_and_run_function": "detailed_memory_dump", + "register_remote_function": "detailed_memory_dump", + }) + + # These colors are for use in Chrome tracing. + _chrome_tracing_colors = [ + "thread_state_uninterruptible", + "thread_state_iowait", + "thread_state_running", + "thread_state_runnable", + "thread_state_sleeping", + "thread_state_unknown", + "background_memory_dump", + "light_memory_dump", + "detailed_memory_dump", + "vsync_highlight_color", + "generic_work", + "good", + "bad", + "terrible", + # "black", + # "grey", + # "white", + "yellow", + "olive", + "rail_response", + "rail_animation", + "rail_idle", + "rail_load", + "startup", + "heap_dump_stack_frame", + "heap_dump_object_type", + "heap_dump_child_node_arrow", + "cq_build_running", + "cq_build_passed", + "cq_build_failed", + "cq_build_abandoned", + "cq_build_attempt_runnig", + "cq_build_attempt_passed", + "cq_build_attempt_failed", + ] + + def chrome_tracing_dump(self, filename=None): """Return a list of profiling events that can viewed as a timeline. To view this information as a timeline, simply dump it as a json file - using json.dumps, and then load go to chrome://tracing in the Chrome - web browser and load the dumped file. Make sure to enable "Flow events" - in the "View Options" menu. + by passing in "filename" or using using json.dump, and then load go to + chrome://tracing in the Chrome web browser and load the dumped file. + Make sure to enable "Flow events" in the "View Options" menu. Args: - include_task_data: If true, we will include more task metadata such - as the task specifications in the json. filename: If a filename is provided, the timeline is dumped to that file. - open_browser: If true, we will attempt to automatically open the - timeline visualization in Chrome. Returns: If filename is not provided, this returns a list of profiling @@ -793,38 +541,15 @@ def chrome_tracing_dump(self, # TODO(rkn): This should support viewing just a window of time or a # limited number of events. 
- if include_task_data: - raise NotImplementedError("This flag has not been implented yet.") - - if open_browser: - raise NotImplementedError("This flag has not been implented yet.") - profile_table = self.profile_table() all_events = [] - # Colors are specified at - # https://github.com/catapult-project/catapult/blob/master/tracing/tracing/base/color_scheme.html. # noqa: E501 - default_color_mapping = defaultdict( - lambda: "generic_work", { - "get_task": "cq_build_abandoned", - "task": "rail_response", - "task:deserialize_arguments": "rail_load", - "task:execute": "rail_animation", - "task:store_outputs": "rail_idle", - "wait_for_function": "detailed_memory_dump", - "ray.get": "good", - "ray.put": "terrible", - "ray.wait": "vsync_highlight_color", - "submit_task": "background_memory_dump", - "fetch_and_run_function": "detailed_memory_dump", - "register_remote_function": "detailed_memory_dump", - }) - - def seconds_to_microseconds(time_in_seconds): - time_in_microseconds = 10**6 * time_in_seconds - return time_in_microseconds - for component_id_hex, component_events in profile_table.items(): + # Only consider workers and drivers. + component_type = component_events[0]["component_type"] + if component_type not in ["worker", "driver"]: + continue + for event in component_events: new_event = { # The category of the event. @@ -838,14 +563,14 @@ def seconds_to_microseconds(time_in_seconds): "tid": event["component_type"] + ":" + event["component_id"], # The start time in microseconds. - "ts": seconds_to_microseconds(event["start_time"]), + "ts": self._seconds_to_microseconds(event["start_time"]), # The duration in microseconds. - "dur": seconds_to_microseconds(event["end_time"] - - event["start_time"]), + "dur": self._seconds_to_microseconds(event["end_time"] - + event["start_time"]), # What is this? "ph": "X", # This is the name of the color to display the box in. - "cname": default_color_mapping[event["event_type"]], + "cname": self._default_color_mapping[event["event_type"]], # The extra user-defined data. "args": event["extra_data"], } @@ -865,357 +590,96 @@ def seconds_to_microseconds(time_in_seconds): else: return all_events - def dump_catapult_trace(self, - path, - task_info, - breakdowns=True, - task_dep=True, - obj_dep=True): - """Dump task profiling information to a file. + def chrome_tracing_object_transfer_dump(self, filename=None): + """Return a list of transfer events that can viewed as a timeline. - This information can be viewed as a timeline of profiling information - by going to chrome://tracing in the chrome web browser and loading the - appropriate file. + To view this information as a timeline, simply dump it as a json file + by passing in "filename" or using using json.dump, and then load go to + chrome://tracing in the Chrome web browser and load the dumped file. + Make sure to enable "Flow events" in the "View Options" menu. Args: - path: The filepath to dump the profiling information to. - task_info: The task info to use to generate the trace. Should be - the output of ray.global_state.task_profiles(). - breakdowns: Boolean indicating whether to break down the tasks into - more fine-grained segments. - task_dep: Boolean indicating whether or not task submission edges - should be included in the trace. - obj_dep: Boolean indicating whether or not object dependency edges - should be included in the trace. 
- """ - workers = self.workers() - - task_table = {} - # TODO(ekl) reduce the number of RPCs here with MGET - for task_id, _ in task_info.items(): - try: - # TODO (hme): do something to correct slider here, - # slider should be correct to begin with, though. - task_table[task_id] = self.task_table(task_id) - task_table[task_id]["TaskSpec"]["Args"] = [ - repr(arg) - for arg in task_table[task_id]["TaskSpec"]["Args"] - ] - except Exception as e: - print("Could not find task {}".format(task_id)) - - # filter out tasks not in task_table - task_info = {k: v for k, v in task_info.items() if k in task_table} - - start_time = None - for info in task_info.values(): - task_start = min(self._get_times(info)) - if not start_time or task_start < start_time: - start_time = task_start - - def micros(ts): - return int(1e6 * ts) - - def micros_rel(ts): - return micros(ts - start_time) - - seen_obj = {} - - full_trace = [] - for task_id, info in task_info.items(): - worker = workers[info["worker_id"]] - task_t_info = task_table[task_id] - - # The total_info dictionary is what is displayed when selecting a - # task in the timeline. We copy the task spec so that we don't - # modify it in place since we will use the original values later. - total_info = copy.copy(task_table[task_id]["TaskSpec"]) - total_info["Args"] = [ - oid.hex() if isinstance(oid, ray.ObjectID) else oid - for oid in task_t_info["TaskSpec"]["Args"] - ] - total_info["ReturnObjectIDs"] = [ - oid.hex() for oid in task_t_info["TaskSpec"]["ReturnObjectIDs"] - ] - total_info["LocalSchedulerID"] = task_t_info["LocalSchedulerID"] - total_info["get_arguments"] = ( - info["get_arguments_end"] - info["get_arguments_start"]) - total_info["execute"] = ( - info["execute_end"] - info["execute_start"]) - total_info["store_outputs"] = ( - info["store_outputs_end"] - info["store_outputs_start"]) - total_info["function_name"] = info["function_name"] - total_info["worker_id"] = info["worker_id"] - - parent_info = task_info.get( - task_table[task_id]["TaskSpec"]["ParentTaskID"]) - worker = workers[info["worker_id"]] - # The catapult trace format documentation can be found here: - # https://docs.google.com/document/d/1CvAClvFfyA5R-PhYUmn5OOQtYMH4h6I0nSsKchNAySU/preview # noqa: E501 - if breakdowns: - if "get_arguments_end" in info: - get_args_trace = { - "cat": "get_arguments", - "pid": "Node " + worker["node_ip_address"], - "tid": info["worker_id"], - "id": task_id, - "ts": micros_rel(info["get_arguments_start"]), - "ph": "X", - "name": info["function_name"] + ":get_arguments", - "args": total_info, - "dur": micros(info["get_arguments_end"] - - info["get_arguments_start"]), - "cname": "rail_idle" - } - full_trace.append(get_args_trace) - - if "store_outputs_end" in info: - outputs_trace = { - "cat": "store_outputs", - "pid": "Node " + worker["node_ip_address"], - "tid": info["worker_id"], - "id": task_id, - "ts": micros_rel(info["store_outputs_start"]), - "ph": "X", - "name": info["function_name"] + ":store_outputs", - "args": total_info, - "dur": micros(info["store_outputs_end"] - - info["store_outputs_start"]), - "cname": "thread_state_runnable" - } - full_trace.append(outputs_trace) - - if "execute_end" in info: - execute_trace = { - "cat": "execute", - "pid": "Node " + worker["node_ip_address"], - "tid": info["worker_id"], - "id": task_id, - "ts": micros_rel(info["execute_start"]), - "ph": "X", - "name": info["function_name"] + ":execute", - "args": total_info, - "dur": micros(info["execute_end"] - - info["execute_start"]), - "cname": "rail_animation" - } - 
full_trace.append(execute_trace) - - else: - if parent_info: - parent_worker = workers[parent_info["worker_id"]] - parent_times = self._get_times(parent_info) - parent_profile = task_info.get( - task_table[task_id]["TaskSpec"]["ParentTaskID"]) - - _parent_id = parent_info["worker_id"] + str( - micros(min(parent_times))) - - parent = { - "cat": "submit_task", - "pid": "Node " + parent_worker["node_ip_address"], - "tid": parent_info["worker_id"], - "ts": micros_rel( - parent_profile - and parent_profile["get_arguments_start"] - or start_time), - "ph": "s", - "name": "SubmitTask", - "args": {}, - "id": _parent_id, - } - full_trace.append(parent) - - _id = info["worker_id"] + str(micros(min(parent_times))) - - task_trace = { - "cat": "submit_task", - "pid": "Node " + worker["node_ip_address"], - "tid": info["worker_id"], - "ts": micros_rel(info["get_arguments_start"]), - "ph": "f", - "name": "SubmitTask", - "args": {}, - "id": _id, - "bp": "e", - "cname": "olive" - } - full_trace.append(task_trace) - - task = { - "cat": "task", - "pid": "Node " + worker["node_ip_address"], - "tid": info["worker_id"], - "id": task_id, - "ts": micros_rel(info["get_arguments_start"]), - "ph": "X", - "name": info["function_name"], - "args": total_info, - "dur": micros(info["store_outputs_end"] - - info["get_arguments_start"]), - "cname": "thread_state_runnable" - } - full_trace.append(task) - - if task_dep: - if parent_info: - parent_worker = workers[parent_info["worker_id"]] - parent_times = self._get_times(parent_info) - parent_profile = task_info.get( - task_table[task_id]["TaskSpec"]["ParentTaskID"]) - - _parent_id = parent_info["worker_id"] + str( - micros(min(parent_times))) - - parent = { - "cat": "submit_task", - "pid": "Node " + parent_worker["node_ip_address"], - "tid": parent_info["worker_id"], - "ts": micros_rel( - parent_profile - and parent_profile["get_arguments_start"] - or start_time), - "ph": "s", - "name": "SubmitTask", - "args": {}, - "id": _parent_id, - } - full_trace.append(parent) - - _id = info["worker_id"] + str(micros(min(parent_times))) - - task_trace = { - "cat": "submit_task", - "pid": "Node " + worker["node_ip_address"], - "tid": info["worker_id"], - "ts": micros_rel(info["get_arguments_start"]), - "ph": "f", - "name": "SubmitTask", - "args": {}, - "id": _id, - "bp": "e" - } - full_trace.append(task_trace) - - if obj_dep: - args = task_table[task_id]["TaskSpec"]["Args"] - for arg in args: - # Don't visualize arguments that are not object IDs. - if isinstance(arg, ray.ObjectID): - object_info = self._object_table(arg) - # Don't visualize objects that were created by calls to - # put. - if not object_info["IsPut"]: - if arg not in seen_obj: - seen_obj[arg] = 0 - seen_obj[arg] += 1 - owner_task = self._object_table(arg)["TaskID"] - if owner_task in task_info: - owner_worker = (workers[task_info[owner_task][ - "worker_id"]]) - # Adding/subtracting 2 to the time associated - # with the beginning/ending of the flow event - # is necessary to make the flow events show up - # reliably. When these times are exact, this is - # presumably an edge case, and catapult doesn't - # recognize that there is a duration event at - # that exact point in time that the flow event - # should be bound to. This issue is solved by - # adding the 2 ms to the start/end time of the - # flow event, which guarantees overlap with the - # duration event that it's associated with, and - # the flow event therefore always gets drawn. 
- owner = { - "cat": "obj_dependency", - "pid": ("Node " + - owner_worker["node_ip_address"]), - "tid": task_info[owner_task]["worker_id"], - "ts": micros_rel(task_info[owner_task] - ["store_outputs_end"]) - - 2, - "ph": "s", - "name": "ObjectDependency", - "args": {}, - "bp": "e", - "cname": "cq_build_attempt_failed", - "id": "obj" + str(arg) + str(seen_obj[arg]) - } - full_trace.append(owner) - - dependent = { - "cat": "obj_dependency", - "pid": "Node " + worker["node_ip_address"], - "tid": info["worker_id"], - "ts": micros_rel(info["get_arguments_start"]) + - 2, - "ph": "f", - "name": "ObjectDependency", - "args": {}, - "cname": "cq_build_attempt_failed", - "bp": "e", - "id": "obj" + str(arg) + str(seen_obj[arg]) - } - full_trace.append(dependent) - - print("Creating JSON {}/{}".format(len(full_trace), len(task_info))) - with open(path, "w") as outfile: - json.dump(full_trace, outfile) - - def _get_times(self, data): - """Extract the numerical times from a task profile. - - This is a helper method for dump_catapult_trace. + filename: If a filename is provided, the timeline is dumped to that + file. - Args: - data: This must be a value in the dictionary returned by the - task_profiles function. - """ - all_times = [] - all_times.append(data["acquire_lock_start"]) - all_times.append(data["acquire_lock_end"]) - all_times.append(data["get_arguments_start"]) - all_times.append(data["get_arguments_end"]) - all_times.append(data["execute_start"]) - all_times.append(data["execute_end"]) - all_times.append(data["store_outputs_start"]) - all_times.append(data["store_outputs_end"]) - return all_times - - def _add_missing_timestamps(self, info): - """Fills in any missing timestamp values in a task info. - - Task timestamps may be missing if the task fails or is partially - executed. + Returns: + If filename is not provided, this returns a list of profiling + events. Each profile event is a dictionary. """ + client_id_to_address = {} + for client_info in ray.global_state.client_table(): + client_id_to_address[client_info["ClientID"]] = "{}:{}".format( + client_info["NodeManagerAddress"], + client_info["ObjectManagerPort"]) - keys = [ - "acquire_lock_start", "acquire_lock_end", "get_arguments_start", - "get_arguments_end", "execute_start", "execute_end", - "store_outputs_start", "store_outputs_end" - ] + all_events = [] + + for key, items in self.profile_table().items(): + # Only consider object manager events. + if items[0]["component_type"] != "object_manager": + continue - latest_timestamp = 0 - for key in keys: - cur = info.get(key, latest_timestamp) - info[key] = cur - latest_timestamp = cur + for event in items: + if event["event_type"] == "transfer_send": + object_id, remote_client_id, _, _ = event["extra_data"] - def local_schedulers(self): - """Get a list of live local schedulers. + elif event["event_type"] == "transfer_receive": + object_id, remote_client_id, _, _ = event["extra_data"] - Returns: - A list of the live local schedulers. - """ - if self.use_raylet: - raise Exception("The local_schedulers() method is deprecated.") - clients = self.client_table() - local_schedulers = [] - for ip_address, client_list in clients.items(): - for client in client_list: - if (client["ClientType"] == "local_scheduler" - and not client["Deleted"]): - local_schedulers.append(client) - return local_schedulers + elif event["event_type"] == "receive_pull_request": + object_id, remote_client_id = event["extra_data"] + + else: + assert False, "This should be unreachable." 
+ + # Choose a color by reading the first couple of hex digits of + # the object ID as an integer and turning that into a color. + object_id_int = int(object_id[:2], 16) + color = self._chrome_tracing_colors[object_id_int % len( + self._chrome_tracing_colors)] + + new_event = { + # The category of the event. + "cat": event["event_type"], + # The string displayed on the event. + "name": event["event_type"], + # The identifier for the group of rows that the event + # appears in. + "pid": client_id_to_address[key], + # The identifier for the row that the event appears in. + "tid": client_id_to_address[remote_client_id], + # The start time in microseconds. + "ts": self._seconds_to_microseconds(event["start_time"]), + # The duration in microseconds. + "dur": self._seconds_to_microseconds(event["end_time"] - + event["start_time"]), + # What is this? + "ph": "X", + # This is the name of the color to display the box in. + "cname": color, + # The extra user-defined data. + "args": event["extra_data"], + } + all_events.append(new_event) + + # Add another box with a color indicating whether it was a send + # or a receive event. + if event["event_type"] == "transfer_send": + additional_event = new_event.copy() + additional_event["cname"] = "black" + all_events.append(additional_event) + elif event["event_type"] == "transfer_receive": + additional_event = new_event.copy() + additional_event["cname"] = "grey" + all_events.append(additional_event) + else: + pass + + if filename is not None: + with open(filename, "w") as outfile: + json.dump(all_events, outfile) + else: + return all_events def workers(self): """Get a dictionary mapping worker ID to worker information.""" @@ -1227,11 +691,7 @@ def workers(self): worker_id = binary_to_hex(worker_key[len("Workers:"):]) workers_data[worker_id] = { - "local_scheduler_socket": (decode( - worker_info[b"local_scheduler_socket"])), "node_ip_address": decode(worker_info[b"node_ip_address"]), - "plasma_manager_socket": decode( - worker_info[b"plasma_manager_socket"]), "plasma_store_socket": decode( worker_info[b"plasma_store_socket"]) } @@ -1291,28 +751,28 @@ def cluster_resources(self): resource in the cluster. """ resources = defaultdict(int) - if not self.use_raylet: - local_schedulers = self.local_schedulers() - - for local_scheduler in local_schedulers: - for key, value in local_scheduler.items(): - if key not in [ - "ClientType", "Deleted", "DBClientID", - "AuxAddress", "LocalSchedulerSocketName" - ]: - resources[key] += value - - else: - clients = self.client_table() - for client in clients: + clients = self.client_table() + for client in clients: + # Only count resources from live clients. + if client["IsInsertion"]: for key, value in client["Resources"].items(): resources[key] += value return dict(resources) + def _live_client_ids(self): + """Returns a set of client IDs corresponding to clients still alive.""" + return { + client["ClientID"] + for client in self.client_table() if client["IsInsertion"] + } + def available_resources(self): """Get the current available cluster resources. + This is different from `cluster_resources` in that this will return + idle (available) resources rather than total resources. + Note that this information can grow stale as tasks start and finish. 
Returns: @@ -1321,97 +781,48 @@ def available_resources(self): """ available_resources_by_id = {} - if not self.use_raylet: - subscribe_client = self.redis_client.pubsub() - subscribe_client.subscribe( - ray.gcs_utils.LOCAL_SCHEDULER_INFO_CHANNEL) + subscribe_clients = [ + redis_client.pubsub(ignore_subscribe_messages=True) + for redis_client in self.redis_clients + ] + for subscribe_client in subscribe_clients: + subscribe_client.subscribe(ray.gcs_utils.XRAY_HEARTBEAT_CHANNEL) - local_scheduler_ids = { - local_scheduler["DBClientID"] - for local_scheduler in self.local_schedulers() - } + client_ids = self._live_client_ids() - while set(available_resources_by_id.keys()) != local_scheduler_ids: + while set(available_resources_by_id.keys()) != client_ids: + for subscribe_client in subscribe_clients: + # Parse client message raw_message = subscribe_client.get_message() - if raw_message is None: + if (raw_message is None or raw_message["channel"] != + ray.gcs_utils.XRAY_HEARTBEAT_CHANNEL): continue data = raw_message["data"] - # Ignore subscribtion success message from Redis - # This is a long in python 2 and an int in python 3 - if isinstance(data, numbers.Number): - continue - message = (ray.gcs_utils.LocalSchedulerInfoMessage. - GetRootAsLocalSchedulerInfoMessage(data, 0)) - num_resources = message.DynamicResourcesLength() + gcs_entries = ( + ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( + data, 0)) + heartbeat_data = gcs_entries.Entries(0) + message = (ray.gcs_utils.HeartbeatTableData. + GetRootAsHeartbeatTableData(heartbeat_data, 0)) + # Calculate available resources for this client + num_resources = message.ResourcesAvailableLabelLength() dynamic_resources = {} for i in range(num_resources): - dyn = message.DynamicResources(i) - resource_id = decode(dyn.Key()) - dynamic_resources[resource_id] = dyn.Value() + resource_id = decode(message.ResourcesAvailableLabel(i)) + dynamic_resources[resource_id] = ( + message.ResourcesAvailableCapacity(i)) - # Update available resources for this local scheduler - client_id = binary_to_hex(message.DbClientId()) + # Update available resources for this client + client_id = ray.utils.binary_to_hex(message.ClientId()) available_resources_by_id[client_id] = dynamic_resources - # Update local schedulers in cluster - local_scheduler_ids = { - local_scheduler["DBClientID"] - for local_scheduler in self.local_schedulers() - } - - # Remove disconnected local schedulers - for local_scheduler_id in available_resources_by_id.keys(): - if local_scheduler_id not in local_scheduler_ids: - del available_resources_by_id[local_scheduler_id] - else: - # Assumes the number of Redis clients does not change - subscribe_clients = [ - redis_client.pubsub(ignore_subscribe_messages=True) - for redis_client in self.redis_clients - ] - for subscribe_client in subscribe_clients: - subscribe_client.subscribe( - ray.gcs_utils.XRAY_HEARTBEAT_CHANNEL) - - client_ids = {client["ClientID"] for client in self.client_table()} - - while set(available_resources_by_id.keys()) != client_ids: - for subscribe_client in subscribe_clients: - # Parse client message - raw_message = subscribe_client.get_message() - if (raw_message is None or raw_message["channel"] != - ray.gcs_utils.XRAY_HEARTBEAT_CHANNEL): - continue - data = raw_message["data"] - gcs_entries = ( - ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( - data, 0)) - heartbeat_data = gcs_entries.Entries(0) - message = (ray.gcs_utils.HeartbeatTableData. 
- GetRootAsHeartbeatTableData(heartbeat_data, 0)) - # Calculate available resources for this client - num_resources = message.ResourcesAvailableLabelLength() - dynamic_resources = {} - for i in range(num_resources): - resource_id = decode( - message.ResourcesAvailableLabel(i)) - dynamic_resources[resource_id] = ( - message.ResourcesAvailableCapacity(i)) - - # Update available resources for this client - client_id = ray.utils.binary_to_hex(message.ClientId()) - available_resources_by_id[client_id] = dynamic_resources - - # Update clients in cluster - client_ids = { - client["ClientID"] - for client in self.client_table() - } + # Update clients in cluster + client_ids = self._live_client_ids() - # Remove disconnected clients - for client_id in available_resources_by_id.keys(): - if client_id not in client_ids: - del available_resources_by_id[client_id] + # Remove disconnected clients + for client_id in available_resources_by_id.keys(): + if client_id not in client_ids: + del available_resources_by_id[client_id] # Calculate total available resources total_available_resources = defaultdict(int) @@ -1464,10 +875,6 @@ def error_messages(self, job_id=None): A dictionary mapping job ID to a list of the error messages for that job. """ - if not self.use_raylet: - raise Exception("The error_messages method is only supported in " - "the raylet code path.") - if job_id is not None: return self._error_messages(job_id) diff --git a/python/ray/experimental/test/async_test.py b/python/ray/experimental/test/async_test.py new file mode 100644 index 0000000000000..bdf45f77e8282 --- /dev/null +++ b/python/ray/experimental/test/async_test.py @@ -0,0 +1,150 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import asyncio +import time + +import pytest + +import ray +from ray.experimental import async_api + + +@pytest.fixture +def init(): + ray.init(num_cpus=4) + async_api.init() + asyncio.get_event_loop().set_debug(False) + yield + async_api.shutdown() + ray.shutdown() + + +def gen_tasks(time_scale=0.1): + @ray.remote + def f(n): + time.sleep(n * time_scale) + return n + + tasks = [f.remote(i) for i in range(5)] + return tasks + + +def test_simple(init): + @ray.remote + def f(): + time.sleep(1) + return {"key1": ["value"]} + + future = async_api.as_future(f.remote()) + result = asyncio.get_event_loop().run_until_complete(future) + assert result["key1"] == ["value"] + + +def test_gather(init): + loop = asyncio.get_event_loop() + tasks = gen_tasks() + futures = [async_api.as_future(obj_id) for obj_id in tasks] + results = loop.run_until_complete(asyncio.gather(*futures)) + assert all(a == b for a, b in zip(results, ray.get(tasks))) + + +def test_gather_benchmark(init): + @ray.remote + def f(n): + time.sleep(0.001 * n) + return 42 + + async def test_async(): + sum_time = 0. + for _ in range(50): + tasks = [f.remote(n) for n in range(20)] + start = time.time() + futures = [async_api.as_future(obj_id) for obj_id in tasks] + await asyncio.gather(*futures) + sum_time += time.time() - start + return sum_time + + def baseline(): + sum_time = 0. + for _ in range(50): + tasks = [f.remote(n) for n in range(20)] + start = time.time() + ray.get(tasks) + sum_time += time.time() - start + return sum_time + + # warm up + baseline() + # async get + sum_time_1 = asyncio.get_event_loop().run_until_complete(test_async()) + # get + sum_time_2 = baseline() + + # Ensure the new implementation is not too slow. 
+ assert sum_time_2 * 1.2 > sum_time_1 + + +def test_wait(init): + loop = asyncio.get_event_loop() + tasks = gen_tasks() + futures = [async_api.as_future(obj_id) for obj_id in tasks] + results, _ = loop.run_until_complete(asyncio.wait(futures)) + assert set(results) == set(futures) + + +def test_wait_timeout(init): + loop = asyncio.get_event_loop() + tasks = gen_tasks(10) + futures = [async_api.as_future(obj_id) for obj_id in tasks] + fut = asyncio.wait(futures, timeout=5) + results, _ = loop.run_until_complete(fut) + assert list(results)[0] == futures[0] + + +def test_gather_mixup(init): + loop = asyncio.get_event_loop() + + @ray.remote + def f(n): + time.sleep(n * 0.1) + return n + + async def g(n): + await asyncio.sleep(n * 0.1) + return n + + tasks = [ + async_api.as_future(f.remote(1)), + g(2), + async_api.as_future(f.remote(3)), + g(4) + ] + results = loop.run_until_complete(asyncio.gather(*tasks)) + assert results == [1, 2, 3, 4] + + +def test_wait_mixup(init): + loop = asyncio.get_event_loop() + + @ray.remote + def f(n): + time.sleep(n) + return n + + def g(n): + async def _g(_n): + await asyncio.sleep(_n) + return _n + + return asyncio.ensure_future(_g(n)) + + tasks = [ + async_api.as_future(f.remote(0.1)), + g(7), + async_api.as_future(f.remote(5)), + g(2) + ] + ready, _ = loop.run_until_complete(asyncio.wait(tasks, timeout=4)) + assert set(ready) == {tasks[0], tasks[-1]} diff --git a/python/ray/experimental/ui.py b/python/ray/experimental/ui.py index da4ee9e57c838..15a6fd05f839d 100644 --- a/python/ray/experimental/ui.py +++ b/python/ray/experimental/ui.py @@ -1,20 +1,23 @@ -import ipywidgets as widgets +import logging import numpy as np import os import pprint -import ray import shutil import tempfile import time +import ipywidgets as widgets from IPython.display import display, IFrame, clear_output +import ray + +logger = logging.getLogger(__name__) + + # Instances of this class maintains keep track of whether or not a # callback is currently executing. Since the execution of the callback # may trigger more calls to the callback, this is used to prevent infinite # recursions. - - class _EventRecursionContextManager(object): def __init__(self): self.should_recurse = True @@ -185,36 +188,6 @@ def update_wrapper(event): range_slider.value = (100 + int( 100 * float(num_tasks_box.value) / num_tasks), 100) - if not update: - return - - diff = largest - smallest - - # Low and high are used to scale the times that are - # queried to be relative to the absolute time. - low, high = map(lambda x: x / 100., range_slider.value) - - # Queries to task_profiles based on the slider and text - # box values. - # (Querying based on the % total amount of time.) - if breakdown_opt.value == total_time_value: - tasks = _truncated_task_profiles( - start=(smallest + diff * low), - end=(smallest + diff * high)) - - # (Querying based on % of total number of tasks that were - # run.) - elif breakdown_opt.value == total_tasks_value: - if range_slider.value[0] == 0: - tasks = _truncated_task_profiles( - num_tasks=(int(num_tasks * high)), fwd=True) - else: - tasks = _truncated_task_profiles( - num_tasks=(int(num_tasks * (high - low))), - fwd=False) - - update(smallest, largest, num_tasks, tasks) - # Get updated values from a slider or text box, and update the rest of # them accordingly. 
range_slider.observe(update_wrapper, names="value") @@ -268,20 +241,6 @@ def handle_submit(sender): MAX_TASKS_TO_VISUALIZE = 10000 -# Wrapper that enforces a limit on the number of tasks to visualize -def _truncated_task_profiles(start=None, end=None, num_tasks=None, fwd=True): - if num_tasks is None: - num_tasks = MAX_TASKS_TO_VISUALIZE - print("Warning: at most {} tasks will be fetched within this " - "time range.".format(MAX_TASKS_TO_VISUALIZE)) - elif num_tasks > MAX_TASKS_TO_VISUALIZE: - print("Warning: too many tasks to visualize, " - "fetching only the first {} of {}.".format( - MAX_TASKS_TO_VISUALIZE, num_tasks)) - num_tasks = MAX_TASKS_TO_VISUALIZE - return ray.global_state.task_profiles(num_tasks, start, end, fwd) - - # Helper function that guarantees unique and writeable temp files. # Prevents clashes in task trace files when multiple notebooks are running. def _get_temp_file_path(**kwargs): @@ -293,32 +252,43 @@ def _get_temp_file_path(**kwargs): def task_timeline(): - path_input = widgets.Button(description="View task timeline") + # Check that the trace viewer renderer file is present, and copy it to the + # current working directory if it is not present. + if not os.path.exists("trace_viewer_full.html"): + shutil.copy( + os.path.join( + os.path.dirname(os.path.abspath(__file__)), + "../core/src/catapult_files/trace_viewer_full.html"), + "trace_viewer_full.html") - breakdown_basic = "Basic" - breakdown_task = "Task Breakdowns" + trace_viewer_path = os.path.join( + os.path.dirname(os.path.abspath(__file__)), + "../core/src/catapult_files/index.html") - breakdown_opt = widgets.Dropdown( - options=["Basic", "Task Breakdowns"], - value="Task Breakdowns", - disabled=False, - ) - obj_dep = widgets.Checkbox( - value=True, disabled=False, layout=widgets.Layout(width='20px')) - task_dep = widgets.Checkbox( - value=True, disabled=False, layout=widgets.Layout(width='20px')) - # Labels to bypass width limitation for descriptions. - label_tasks = widgets.Label( - value='Task submissions', layout=widgets.Layout(width='110px')) - label_objects = widgets.Label( - value='Object dependencies', layout=widgets.Layout(width='130px')) - label_options = widgets.Label( - value='View options:', layout=widgets.Layout(width='100px')) - start_box, end_box, range_slider, time_opt = get_sliders(False) - display(widgets.HBox([task_dep, label_tasks, obj_dep, label_objects])) - display(widgets.HBox([label_options, breakdown_opt])) - display(path_input) + html_file_path = _get_temp_file_path(suffix=".html") + json_file_path = _get_temp_file_path(suffix=".json") + + ray.global_state.chrome_tracing_dump(filename=json_file_path) + + with open(trace_viewer_path) as f: + data = f.read() + + # Replace the demo data path with our own + # https://github.com/catapult-project/catapult/blob/ + # 33a9271eb3cf5caf925293ec6a4b47c94f1ac968/tracing/bin/index.html#L107 + data = data.replace("../test_data/big_trace.json", json_file_path) + + with open(html_file_path, "w+") as f: + f.write(data) + # Display the task trace within the Jupyter notebook + clear_output(wait=True) + logger.info("To view fullscreen, open chrome://tracing in Google Chrome " + "and load `{}`".format(os.path.abspath(json_file_path))) + display(IFrame(html_file_path, 900, 800)) + + +def object_transfer_timeline(): # Check that the trace viewer renderer file is present, and copy it to the # current working directory if it is not present. 
if not os.path.exists("trace_viewer_full.html"): @@ -328,76 +298,32 @@ def task_timeline(): "../core/src/catapult_files/trace_viewer_full.html"), "trace_viewer_full.html") - def handle_submit(sender): - json_tmp = tempfile.mktemp() + ".json" - - # Determine whether task components should be displayed or not. - if breakdown_opt.value == breakdown_basic: - breakdown = False - elif breakdown_opt.value == breakdown_task: - breakdown = True - else: - raise ValueError("Unexpected breakdown value '{}'".format( - breakdown_opt.value)) - - low, high = map(lambda x: x / 100., range_slider.value) - - smallest, largest, num_tasks = ray.global_state._job_length() - diff = largest - smallest - - if time_opt.value == total_time_value: - tasks = _truncated_task_profiles( - start=smallest + diff * low, end=smallest + diff * high) - elif time_opt.value == total_tasks_value: - if range_slider.value[0] == 0: - tasks = _truncated_task_profiles( - num_tasks=int(num_tasks * high), fwd=True) - else: - tasks = _truncated_task_profiles( - num_tasks=int(num_tasks * (high - low)), fwd=False) - else: - raise ValueError("Unexpected time value '{}'".format( - time_opt.value)) - # Write trace to a JSON file - print("Collected profiles for {} tasks.".format(len(tasks))) - print("Dumping task profile data to {}, " - "this might take a while...".format(json_tmp)) - ray.global_state.dump_catapult_trace( - json_tmp, - tasks, - breakdowns=breakdown, - obj_dep=obj_dep.value, - task_dep=task_dep.value) - print("Opening html file in browser...") - - trace_viewer_path = os.path.join( - os.path.dirname(os.path.abspath(__file__)), - "../core/src/catapult_files/index.html") - - html_file_path = _get_temp_file_path(suffix=".html") - json_file_path = _get_temp_file_path(suffix=".json") - - print("Pointing to {} named {}".format(json_tmp, json_file_path)) - shutil.copy(json_tmp, json_file_path) - - with open(trace_viewer_path) as f: - data = f.read() - - # Replace the demo data path with our own - # https://github.com/catapult-project/catapult/blob/ - # 33a9271eb3cf5caf925293ec6a4b47c94f1ac968/tracing/bin/index.html#L107 - data = data.replace("../test_data/big_trace.json", json_file_path) - - with open(html_file_path, "w+") as f: - f.write(data) - - # Display the task trace within the Jupyter notebook - clear_output(wait=True) - print("To view fullscreen, open chrome://tracing in Google Chrome " - "and load `{}`".format(json_tmp)) - display(IFrame(html_file_path, 900, 800)) - - path_input.on_click(handle_submit) + trace_viewer_path = os.path.join( + os.path.dirname(os.path.abspath(__file__)), + "../core/src/catapult_files/index.html") + + html_file_path = _get_temp_file_path(suffix=".html") + json_file_path = _get_temp_file_path(suffix=".json") + + ray.global_state.chrome_tracing_object_transfer_dump( + filename=json_file_path) + + with open(trace_viewer_path) as f: + data = f.read() + + # Replace the demo data path with our own + # https://github.com/catapult-project/catapult/blob/ + # 33a9271eb3cf5caf925293ec6a4b47c94f1ac968/tracing/bin/index.html#L107 + data = data.replace("../test_data/big_trace.json", json_file_path) + + with open(html_file_path, "w+") as f: + f.write(data) + + # Display the task trace within the Jupyter notebook + clear_output(wait=True) + logger.info("To view fullscreen, open chrome://tracing in Google Chrome " + "and load `{}`".format(os.path.abspath(json_file_path))) + display(IFrame(html_file_path, 900, 800)) def task_completion_time_distribution(): @@ -562,12 +488,7 @@ def cpu_usage(): 
     output_notebook(resources=CDN)
 
     # Parse the client table to determine how many CPUs are available
-    num_cpus = 0
-    client_table = ray.global_state.client_table()
-    for node_ip, client_list in client_table.items():
-        for client in client_list:
-            if "CPU" in client:
-                num_cpus += client["CPU"]
+    num_cpus = ray.global_state.cluster_resources()["CPU"]
 
     # Update the plot based on the sliders
     def plot_utilization():
diff --git a/python/ray/function_manager.py b/python/ray/function_manager.py
new file mode 100644
index 0000000000000..72ec53651df76
--- /dev/null
+++ b/python/ray/function_manager.py
@@ -0,0 +1,495 @@
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import hashlib
+import inspect
+import json
+import sys
+import time
+import traceback
+from collections import (
+    namedtuple,
+    defaultdict,
+)
+
+import ray
+from ray import profiling
+from ray import ray_constants
+from ray import cloudpickle as pickle
+from ray.utils import (
+    is_cython,
+    is_function_or_method,
+    is_class_method,
+    check_oversized_pickle,
+    decode,
+    format_error_message,
+    push_error_to_driver,
+)
+
+FunctionExecutionInfo = namedtuple("FunctionExecutionInfo",
+                                   ["function", "function_name", "max_calls"])
+"""FunctionExecutionInfo: A named tuple storing remote function information."""
+
+
+class FunctionActorManager(object):
+    """A class used to export/load remote functions and actors.
+
+    Attributes:
+        _worker: The associated worker that this manager is related to.
+        _functions_to_export: The remote functions to export when
+            the worker gets connected.
+        _actors_to_export: The actors to export when the worker gets
+            connected.
+        _function_execution_info: The map from driver_id to function_id
+            and execution_info.
+        _num_task_executions: The map from driver_id to the number of
+            times each function has been executed.
+    """
+
+    def __init__(self, worker):
+        self._worker = worker
+        self._functions_to_export = []
+        self._actors_to_export = []
+        # This field is a dictionary that maps a driver ID to a dictionary of
+        # functions (and information about those functions) that have been
+        # registered for that driver (this inner dictionary maps function IDs
+        # to a FunctionExecutionInfo object). This should only be used on
+        # workers that execute remote functions.
+        self._function_execution_info = defaultdict(lambda: {})
+        self._num_task_executions = defaultdict(lambda: {})
+
+    def increase_task_counter(self, driver_id, function_id):
+        self._num_task_executions[driver_id][function_id] += 1
+
+    def get_task_counter(self, driver_id, function_id):
+        return self._num_task_executions[driver_id][function_id]
+
+    def export_cached(self):
+        """Export cached remote functions.
+
+        Note: this should be called only once when the worker is connected.
+        """
+        for remote_function in self._functions_to_export:
+            self._do_export(remote_function)
+        self._functions_to_export = None
+        for info in self._actors_to_export:
+            (key, actor_class_info) = info
+            self._publish_actor_class_to_key(key, actor_class_info)
+
+    def reset_cache(self):
+        self._functions_to_export = []
+        self._actors_to_export = []
+
+    def export(self, remote_function):
+        """Export a remote function.
+
+        Args:
+            remote_function: the RemoteFunction object.
+        """
+        if self._worker.mode is None:
+            # If the worker isn't connected, cache the function
+            # and export it later.
+            self._functions_to_export.append(remote_function)
+            return
+        if self._worker.mode != ray.worker.SCRIPT_MODE:
+            # Don't need to export if the worker is not a driver.
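# [Editor's illustrative sketch -- not part of the patch; it only annotates the export()
# logic interrupted here.] Assuming the usual @ray.remote decorator flow, a function
# declared before ray.init() takes the caching branch above and is only published to
# Redis once the worker connects and export_cached() runs. Roughly:
import ray

@ray.remote                # export() is called while self._worker.mode is None,
def double(x):             # so the RemoteFunction is appended to _functions_to_export.
    return 2 * x

ray.init()                 # the worker connects; export_cached() flushes the cache.
print(ray.get(double.remote(21)))  # -> 42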
+ return + self._do_export(remote_function) + + def _do_export(self, remote_function): + """Pickle a remote function and export it to redis. + + Args: + remote_function: the RemoteFunction object. + """ + # Work around limitations of Python pickling. + function = remote_function._function + function_name_global_valid = function.__name__ in function.__globals__ + function_name_global_value = function.__globals__.get( + function.__name__) + # Allow the function to reference itself as a global variable + if not is_cython(function): + function.__globals__[function.__name__] = remote_function + try: + pickled_function = pickle.dumps(function) + finally: + # Undo our changes + if function_name_global_valid: + function.__globals__[function.__name__] = ( + function_name_global_value) + else: + del function.__globals__[function.__name__] + + check_oversized_pickle(pickled_function, + remote_function._function_name, + "remote function", self._worker) + + key = (b"RemoteFunction:" + self._worker.task_driver_id.id() + b":" + + remote_function._function_id) + self._worker.redis_client.hmset( + key, { + "driver_id": self._worker.task_driver_id.id(), + "function_id": remote_function._function_id, + "name": remote_function._function_name, + "module": function.__module__, + "function": pickled_function, + "max_calls": remote_function._max_calls + }) + self._worker.redis_client.rpush("Exports", key) + + def fetch_and_register_remote_function(self, key): + """Import a remote function.""" + (driver_id, function_id_str, function_name, serialized_function, + num_return_vals, module, resources, + max_calls) = self._worker.redis_client.hmget(key, [ + "driver_id", "function_id", "name", "function", "num_return_vals", + "module", "resources", "max_calls" + ]) + function_id = ray.ObjectID(function_id_str) + function_name = decode(function_name) + max_calls = int(max_calls) + module = decode(module) + + # This is a placeholder in case the function can't be unpickled. This + # will be overwritten if the function is successfully registered. + def f(): + raise Exception("This function was not imported properly.") + + self._function_execution_info[driver_id][function_id.id()] = ( + FunctionExecutionInfo( + function=f, function_name=function_name, max_calls=max_calls)) + self._num_task_executions[driver_id][function_id.id()] = 0 + + try: + function = pickle.loads(serialized_function) + except Exception: + # If an exception was thrown when the remote function was imported, + # we record the traceback and notify the scheduler of the failure. + traceback_str = format_error_message(traceback.format_exc()) + # Log the error message. + push_error_to_driver( + self._worker, + ray_constants.REGISTER_REMOTE_FUNCTION_PUSH_ERROR, + traceback_str, + driver_id=driver_id, + data={ + "function_id": function_id.id(), + "function_name": function_name + }) + else: + # The below line is necessary. Because in the driver process, + # if the function is defined in the file where the python script + # was started from, its module is `__main__`. + # However in the worker process, the `__main__` module is a + # different module, which is `default_worker.py` + function.__module__ = module + self._function_execution_info[driver_id][function_id.id()] = ( + FunctionExecutionInfo( + function=function, + function_name=function_name, + max_calls=max_calls)) + # Add the function to the function table. 
+ self._worker.redis_client.rpush( + b"FunctionTable:" + function_id.id(), self._worker.worker_id) + + def get_execution_info(self, driver_id, function_id): + """Get the FunctionExecutionInfo of a remote function. + + Args: + driver_id: ID of the driver that the function belongs to. + function_id: ID of the function to get. + + Returns: + A FunctionExecutionInfo object. + """ + # Wait until the function to be executed has actually been registered + # on this worker. We will push warnings to the user if we spend too + # long in this loop. + with profiling.profile("wait_for_function", worker=self._worker): + self._wait_for_function(function_id, driver_id) + return self._function_execution_info[driver_id][function_id.id()] + + def _wait_for_function(self, function_id, driver_id, timeout=10): + """Wait until the function to be executed is present on this worker. + + This method will simply loop until the import thread has imported the + relevant function. If we spend too long in this loop, that may indicate + a problem somewhere and we will push an error message to the user. + + If this worker is an actor, then this will wait until the actor has + been defined. + + Args: + function_id (str): The ID of the function that we want to execute. + driver_id (str): The ID of the driver to push the error message to + if this times out. + """ + start_time = time.time() + # Only send the warning once. + warning_sent = False + while True: + with self._worker.lock: + if (self._worker.actor_id == ray.worker.NIL_ACTOR_ID + and (function_id.id() in + self._function_execution_info[driver_id])): + break + elif self._worker.actor_id != ray.worker.NIL_ACTOR_ID and ( + self._worker.actor_id in self._worker.actors): + break + if time.time() - start_time > timeout: + warning_message = ("This worker was asked to execute a " + "function that it does not have " + "registered. You may have to restart " + "Ray.") + if not warning_sent: + ray.utils.push_error_to_driver( + self._worker, + ray_constants.WAIT_FOR_FUNCTION_PUSH_ERROR, + warning_message, + driver_id=driver_id) + warning_sent = True + time.sleep(0.001) + + @classmethod + def compute_actor_method_function_id(cls, class_name, attr): + """Get the function ID corresponding to an actor method. + + Args: + class_name (str): The class name of the actor. + attr (str): The attribute name of the method. + + Returns: + Function ID corresponding to the method. + """ + function_id_hash = hashlib.sha1() + function_id_hash.update(class_name.encode("ascii")) + function_id_hash.update(attr.encode("ascii")) + function_id = function_id_hash.digest() + assert len(function_id) == ray_constants.ID_SIZE + return ray.ObjectID(function_id) + + def _publish_actor_class_to_key(self, key, actor_class_info): + """Push an actor class definition to Redis. + + The is factored out as a separate function because it is also called + on cached actor class definitions when a worker connects for the first + time. + + Args: + key: The key to store the actor class info at. + actor_class_info: Information about the actor class. + worker: The worker to use to connect to Redis. + """ + # We set the driver ID here because it may not have been available when + # the actor class was defined. 
+ actor_class_info["driver_id"] = self._worker.task_driver_id.id() + self._worker.redis_client.hmset(key, actor_class_info) + self._worker.redis_client.rpush("Exports", key) + + def export_actor_class(self, class_id, Class, actor_method_names, + checkpoint_interval): + key = b"ActorClass:" + class_id + actor_class_info = { + "class_name": Class.__name__, + "module": Class.__module__, + "class": pickle.dumps(Class), + "checkpoint_interval": checkpoint_interval, + "actor_method_names": json.dumps(list(actor_method_names)) + } + + check_oversized_pickle(actor_class_info["class"], + actor_class_info["class_name"], "actor", + self._worker) + + if self._worker.mode is None: + # This means that 'ray.init()' has not been called yet and so we + # must cache the actor class definition and export it when + # 'ray.init()' is called. + assert self._actors_to_export is not None + self._actors_to_export.append((key, actor_class_info)) + # This caching code path is currently not used because we only + # export actor class definitions lazily when we instantiate the + # actor for the first time. + assert False, "This should be unreachable." + else: + self._publish_actor_class_to_key(key, actor_class_info) + # TODO(rkn): Currently we allow actor classes to be defined + # within tasks. I tried to disable this, but it may be necessary + # because of https://github.com/ray-project/ray/issues/1146. + + def fetch_and_register_actor(self, actor_class_key): + """Import an actor. + + This will be called by the worker's import thread when the worker + receives the actor_class export, assuming that the worker is an actor + for that class. + + Args: + actor_class_key: The key in Redis to use to fetch the actor. + worker: The worker to use. + """ + actor_id_str = self._worker.actor_id + (driver_id, class_id, class_name, module, pickled_class, + checkpoint_interval, + actor_method_names) = self._worker.redis_client.hmget( + actor_class_key, [ + "driver_id", "class_id", "class_name", "module", "class", + "checkpoint_interval", "actor_method_names" + ]) + + class_name = decode(class_name) + module = decode(module) + checkpoint_interval = int(checkpoint_interval) + actor_method_names = json.loads(decode(actor_method_names)) + + # In Python 2, json loads strings as unicode, so convert them back to + # strings. + if sys.version_info < (3, 0): + actor_method_names = [ + method_name.encode("ascii") + for method_name in actor_method_names + ] + + # Create a temporary actor with some temporary methods so that if + # the actor fails to be unpickled, the temporary actor can be used + # (just to produce error messages and to prevent the driver from + # hanging). + class TemporaryActor(object): + pass + + self._worker.actors[actor_id_str] = TemporaryActor() + self._worker.actor_checkpoint_interval = checkpoint_interval + + def temporary_actor_method(*xs): + raise Exception( + "The actor with name {} failed to be imported, " + "and so cannot execute this method".format(class_name)) + + # Register the actor method executors. 
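# [Editor's illustrative sketch -- not part of the patch.] The loop below keys each
# temporary executor by the ID returned from compute_actor_method_function_id(), defined
# earlier in this file: a SHA-1 over the class name and method name. A standalone
# approximation, with "Counter" / "increment" as purely hypothetical names:
import binascii
import hashlib

def sketch_actor_method_function_id(class_name, method_name):
    # SHA-1 over the class name followed by the method name; the original code asserts
    # that the 20-byte digest length equals ray_constants.ID_SIZE and uses it directly.
    h = hashlib.sha1()
    h.update(class_name.encode("ascii"))
    h.update(method_name.encode("ascii"))
    return h.digest()

# The driver and the actor's worker derive the same ID independently, so a task for a
# given actor method always resolves to the same executor entry.
print(binascii.hexlify(sketch_actor_method_function_id("Counter", "increment")))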
+ for actor_method_name in actor_method_names: + function_id = ( + FunctionActorManager.compute_actor_method_function_id( + class_name, actor_method_name).id()) + temporary_executor = self._make_actor_method_executor( + actor_method_name, + temporary_actor_method, + actor_imported=False) + self._function_execution_info[driver_id][function_id] = ( + FunctionExecutionInfo( + function=temporary_executor, + function_name=actor_method_name, + max_calls=0)) + self._num_task_executions[driver_id][function_id] = 0 + + try: + unpickled_class = pickle.loads(pickled_class) + self._worker.actor_class = unpickled_class + except Exception: + # If an exception was thrown when the actor was imported, we record + # the traceback and notify the scheduler of the failure. + traceback_str = ray.utils.format_error_message( + traceback.format_exc()) + # Log the error message. + push_error_to_driver( + self._worker, + ray_constants.REGISTER_ACTOR_PUSH_ERROR, + traceback_str, + driver_id, + data={"actor_id": actor_id_str}) + # TODO(rkn): In the future, it might make sense to have the worker + # exit here. However, currently that would lead to hanging if + # someone calls ray.get on a method invoked on the actor. + else: + # TODO(pcm): Why is the below line necessary? + unpickled_class.__module__ = module + self._worker.actors[actor_id_str] = unpickled_class.__new__( + unpickled_class) + + actor_methods = inspect.getmembers( + unpickled_class, predicate=is_function_or_method) + for actor_method_name, actor_method in actor_methods: + function_id = ( + FunctionActorManager.compute_actor_method_function_id( + class_name, actor_method_name).id()) + executor = self._make_actor_method_executor( + actor_method_name, actor_method, actor_imported=True) + self._function_execution_info[driver_id][function_id] = ( + FunctionExecutionInfo( + function=executor, + function_name=actor_method_name, + max_calls=0)) + # We do not set function_properties[driver_id][function_id] + # because we currently do need the actor worker to submit new + # tasks for the actor. + + def _make_actor_method_executor(self, method_name, method, actor_imported): + """Make an executor that wraps a user-defined actor method. + + The wrapped method updates the worker's internal state and performs any + necessary checkpointing operations. + + Args: + worker (Worker): The worker that is executing the actor. + method_name (str): The name of the actor method. + method (instancemethod): The actor method to wrap. This should be a + method defined on the actor class and should therefore take an + instance of the actor as the first argument. + actor_imported (bool): Whether the actor has been imported. + Checkpointing operations will not be run if this is set to + False. + + Returns: + A function that executes the given actor method on the worker's + stored instance of the actor. The function also updates the + worker's internal state to record the executed method. + """ + + def actor_method_executor(dummy_return_id, actor, *args): + # Update the actor's task counter to reflect the task we're about + # to execute. + self._worker.actor_task_counter += 1 + + # If this is the first task to execute on the actor, try to resume + # from a checkpoint. + if actor_imported and self._worker.actor_task_counter == 1: + checkpoint_resumed = ray.actor.restore_and_log_checkpoint( + self._worker, actor) + if checkpoint_resumed: + # NOTE(swang): Since we did not actually execute the + # __init__ method, this will put None as the return value. 
+ # If the __init__ method is supposed to return multiple + # values, an exception will be logged. + return + + # Determine whether we should checkpoint the actor. + checkpointing_on = (actor_imported + and self._worker.actor_checkpoint_interval > 0) + # We should checkpoint the actor if user checkpointing is on, we've + # executed checkpoint_interval tasks since the last checkpoint, and + # the method we're about to execute is not a checkpoint. + save_checkpoint = (checkpointing_on + and (self._worker.actor_task_counter % + self._worker.actor_checkpoint_interval == 0 + and method_name != "__ray_checkpoint__")) + + # Execute the assigned method and save a checkpoint if necessary. + try: + if is_class_method(method): + method_returns = method(*args) + else: + method_returns = method(actor, *args) + except Exception: + # Save the checkpoint before allowing the method exception + # to be thrown. + if save_checkpoint: + ray.actor.save_and_log_checkpoint(self._worker, actor) + raise + else: + # Save the checkpoint before returning the method's return + # values. + if save_checkpoint: + ray.actor.save_and_log_checkpoint(self._worker, actor) + return method_returns + + return actor_method_executor diff --git a/python/ray/gcs_utils.py b/python/ray/gcs_utils.py index 2616e064d850f..347f7ab9f8064 100644 --- a/python/ray/gcs_utils.py +++ b/python/ray/gcs_utils.py @@ -4,19 +4,6 @@ import flatbuffers -from ray.core.generated.ResultTableReply import ResultTableReply -from ray.core.generated.SubscribeToNotificationsReply \ - import SubscribeToNotificationsReply -from ray.core.generated.TaskExecutionDependencies import \ - TaskExecutionDependencies -from ray.core.generated.TaskReply import TaskReply -from ray.core.generated.DriverTableMessage import DriverTableMessage -from ray.core.generated.LocalSchedulerInfoMessage import \ - LocalSchedulerInfoMessage -from ray.core.generated.SubscribeToDBClientTableReply import \ - SubscribeToDBClientTableReply -from ray.core.generated.TaskInfo import TaskInfo - import ray.core.generated.ErrorTableData from ray.core.generated.GcsTableEntry import GcsTableEntry @@ -24,6 +11,7 @@ from ray.core.generated.ErrorTableData import ErrorTableData from ray.core.generated.ProfileTableData import ProfileTableData from ray.core.generated.HeartbeatTableData import HeartbeatTableData +from ray.core.generated.HeartbeatBatchTableData import HeartbeatBatchTableData from ray.core.generated.DriverTableData import DriverTableData from ray.core.generated.ObjectTableData import ObjectTableData from ray.core.generated.ray.protocol.Task import Task @@ -32,31 +20,17 @@ from ray.core.generated.TablePubsub import TablePubsub __all__ = [ - "SubscribeToNotificationsReply", "ResultTableReply", - "TaskExecutionDependencies", "TaskReply", "DriverTableMessage", - "LocalSchedulerInfoMessage", "SubscribeToDBClientTableReply", "TaskInfo", "GcsTableEntry", "ClientTableData", "ErrorTableData", "HeartbeatTableData", - "DriverTableData", "ProfileTableData", "ObjectTableData", "Task", - "TablePrefix", "TablePubsub", "construct_error_message" + "HeartbeatBatchTableData", "DriverTableData", "ProfileTableData", + "ObjectTableData", "Task", "TablePrefix", "TablePubsub", + "construct_error_message" ] -# These prefixes must be kept up-to-date with the definitions in -# ray_redis_module.cc. 
-DB_CLIENT_PREFIX = "CL:" -TASK_PREFIX = "TT:" -OBJECT_CHANNEL_PREFIX = "OC:" -OBJECT_INFO_PREFIX = "OI:" -OBJECT_LOCATION_PREFIX = "OL:" FUNCTION_PREFIX = "RemoteFunction:" -# These prefixes must be kept up-to-date with the definitions in -# common/state/redis.cc -LOCAL_SCHEDULER_INFO_CHANNEL = b"local_schedulers" -PLASMA_MANAGER_HEARTBEAT_CHANNEL = b"plasma_managers" -DRIVER_DEATH_CHANNEL = b"driver_deaths" - # xray heartbeats XRAY_HEARTBEAT_CHANNEL = str(TablePubsub.HEARTBEAT).encode("ascii") +XRAY_HEARTBEAT_BATCH_CHANNEL = str(TablePubsub.HEARTBEAT_BATCH).encode("ascii") # xray driver updates XRAY_DRIVER_CHANNEL = str(TablePubsub.DRIVER).encode("ascii") diff --git a/python/ray/global_scheduler/__init__.py b/python/ray/global_scheduler/__init__.py deleted file mode 100644 index 25e4d2cf6490c..0000000000000 --- a/python/ray/global_scheduler/__init__.py +++ /dev/null @@ -1,7 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -from .global_scheduler_services import start_global_scheduler - -__all__ = ["start_global_scheduler"] diff --git a/python/ray/global_scheduler/build/.gitkeep b/python/ray/global_scheduler/build/.gitkeep deleted file mode 100644 index e69de29bb2d1d..0000000000000 diff --git a/python/ray/global_scheduler/global_scheduler_services.py b/python/ray/global_scheduler/global_scheduler_services.py deleted file mode 100644 index 7e3d019ffa980..0000000000000 --- a/python/ray/global_scheduler/global_scheduler_services.py +++ /dev/null @@ -1,61 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import os -import subprocess -import time - - -def start_global_scheduler(redis_address, - node_ip_address, - use_valgrind=False, - use_profiler=False, - stdout_file=None, - stderr_file=None): - """Start a global scheduler process. - - Args: - redis_address (str): The address of the Redis instance. - node_ip_address: The IP address of the node that this scheduler will - run on. - use_valgrind (bool): True if the global scheduler should be started - inside of valgrind. If this is True, use_profiler must be False. - use_profiler (bool): True if the global scheduler should be started - inside a profiler. If this is True, use_valgrind must be False. - stdout_file: A file handle opened for writing to redirect stdout to. If - no redirection should happen, then this should be None. - stderr_file: A file handle opened for writing to redirect stderr to. If - no redirection should happen, then this should be None. - - Return: - The process ID of the global scheduler process. 
- """ - if use_valgrind and use_profiler: - raise Exception("Cannot use valgrind and profiler at the same time.") - global_scheduler_executable = os.path.join( - os.path.abspath(os.path.dirname(__file__)), - "../core/src/global_scheduler/global_scheduler") - command = [ - global_scheduler_executable, "-r", redis_address, "-h", node_ip_address - ] - if use_valgrind: - pid = subprocess.Popen( - [ - "valgrind", "--track-origins=yes", "--leak-check=full", - "--show-leak-kinds=all", "--leak-check-heuristics=stdstring", - "--error-exitcode=1" - ] + command, - stdout=stdout_file, - stderr=stderr_file) - time.sleep(1.0) - elif use_profiler: - pid = subprocess.Popen( - ["valgrind", "--tool=callgrind"] + command, - stdout=stdout_file, - stderr=stderr_file) - time.sleep(1.0) - else: - pid = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) - time.sleep(0.1) - return pid diff --git a/python/ray/global_scheduler/test/test.py b/python/ray/global_scheduler/test/test.py deleted file mode 100644 index 37aad62ee1b01..0000000000000 --- a/python/ray/global_scheduler/test/test.py +++ /dev/null @@ -1,332 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import numpy as np -import os -import random -import signal -import sys -import time -import unittest - -# The ray import must come before the pyarrow import because ray modifies the -# python path so that the right version of pyarrow is found. -import ray.global_scheduler as global_scheduler -import ray.local_scheduler as local_scheduler -import ray.plasma as plasma -from ray.plasma.utils import create_object -from ray import services -from ray.experimental import state -import ray.ray_constants as ray_constants -import pyarrow as pa - -USE_VALGRIND = False -PLASMA_STORE_MEMORY = 1000000000 -NUM_CLUSTER_NODES = 2 - -NIL_WORKER_ID = ray_constants.ID_SIZE * b"\xff" -NIL_OBJECT_ID = ray_constants.ID_SIZE * b"\xff" -NIL_ACTOR_ID = ray_constants.ID_SIZE * b"\xff" - - -def random_driver_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_task_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_function_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_object_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def new_port(): - return random.randint(10000, 65535) - - -class TestGlobalScheduler(unittest.TestCase): - def setUp(self): - # Start one Redis server and N pairs of (plasma, local_scheduler) - self.node_ip_address = "127.0.0.1" - redis_address, redis_shards = services.start_redis( - self.node_ip_address) - redis_port = services.get_port(redis_address) - time.sleep(0.1) - # Create a client for the global state store. - self.state = state.GlobalState() - self.state._initialize_global_state(self.node_ip_address, redis_port) - - # Start one global scheduler. - self.p1 = global_scheduler.start_global_scheduler( - redis_address, self.node_ip_address, use_valgrind=USE_VALGRIND) - self.plasma_store_pids = [] - self.plasma_manager_pids = [] - self.local_scheduler_pids = [] - self.plasma_clients = [] - self.local_scheduler_clients = [] - - for i in range(NUM_CLUSTER_NODES): - # Start the Plasma store. Plasma store name is randomly generated. - plasma_store_name, p2 = plasma.start_plasma_store() - self.plasma_store_pids.append(p2) - # Start the Plasma manager. 
- # Assumption: Plasma manager name and port are randomly generated - # by the plasma module. - manager_info = plasma.start_plasma_manager(plasma_store_name, - redis_address) - plasma_manager_name, p3, plasma_manager_port = manager_info - self.plasma_manager_pids.append(p3) - plasma_address = "{}:{}".format(self.node_ip_address, - plasma_manager_port) - plasma_client = pa.plasma.connect(plasma_store_name, - plasma_manager_name, 64) - self.plasma_clients.append(plasma_client) - # Start the local scheduler. - local_scheduler_name, p4 = local_scheduler.start_local_scheduler( - plasma_store_name, - plasma_manager_name=plasma_manager_name, - plasma_address=plasma_address, - redis_address=redis_address, - static_resources={"CPU": 10}) - # Connect to the scheduler. - local_scheduler_client = local_scheduler.LocalSchedulerClient( - local_scheduler_name, NIL_WORKER_ID, False, random_task_id(), - False) - self.local_scheduler_clients.append(local_scheduler_client) - self.local_scheduler_pids.append(p4) - - def tearDown(self): - # Check that the processes are still alive. - self.assertEqual(self.p1.poll(), None) - for p2 in self.plasma_store_pids: - self.assertEqual(p2.poll(), None) - for p3 in self.plasma_manager_pids: - self.assertEqual(p3.poll(), None) - for p4 in self.local_scheduler_pids: - self.assertEqual(p4.poll(), None) - - redis_processes = services.all_processes[ - services.PROCESS_TYPE_REDIS_SERVER] - for redis_process in redis_processes: - self.assertEqual(redis_process.poll(), None) - - # Kill the global scheduler. - if USE_VALGRIND: - self.p1.send_signal(signal.SIGTERM) - self.p1.wait() - if self.p1.returncode != 0: - os._exit(-1) - else: - self.p1.kill() - # Kill local schedulers, plasma managers, and plasma stores. - for p2 in self.local_scheduler_pids: - p2.kill() - for p3 in self.plasma_manager_pids: - p3.kill() - for p4 in self.plasma_store_pids: - p4.kill() - # Kill Redis. In the event that we are using valgrind, this needs to - # happen after we kill the global scheduler. - while redis_processes: - redis_process = redis_processes.pop() - redis_process.kill() - - def get_plasma_manager_id(self): - """Get the db_client_id with client_type equal to plasma_manager. - - Iterates over all the client table keys, gets the db_client_id for the - client with client_type matching plasma_manager. Strips the client - table prefix. TODO(atumanov): write a separate function to get all - plasma manager client IDs. - - Returns: - The db_client_id if one is found and otherwise None. - """ - db_client_id = None - - client_list = self.state.client_table()[self.node_ip_address] - for client in client_list: - if client["ClientType"] == "plasma_manager": - db_client_id = client["DBClientID"] - break - - return db_client_id - - def test_task_default_resources(self): - task1 = local_scheduler.Task( - random_driver_id(), random_function_id(), [random_object_id()], 0, - random_task_id(), 0) - self.assertEqual(task1.required_resources(), {"CPU": 1}) - task2 = local_scheduler.Task( - random_driver_id(), random_function_id(), [random_object_id()], 0, - random_task_id(), 0, local_scheduler.ObjectID(NIL_ACTOR_ID), - local_scheduler.ObjectID(NIL_OBJECT_ID), - local_scheduler.ObjectID(NIL_ACTOR_ID), - local_scheduler.ObjectID(NIL_ACTOR_ID), 0, 0, [], { - "CPU": 1, - "GPU": 2 - }) - self.assertEqual(task2.required_resources(), {"CPU": 1, "GPU": 2}) - - def test_redis_only_single_task(self): - # Tests global scheduler functionality by interacting with Redis and - # checking task state transitions in Redis only. 
TODO(atumanov): - # implement. - - # Check precondition for this test: - # There should be 2n+1 db clients: the global scheduler + one local - # scheduler and one plasma per node. - self.assertEqual( - len(self.state.client_table()[self.node_ip_address]), - 2 * NUM_CLUSTER_NODES + 1) - db_client_id = self.get_plasma_manager_id() - assert (db_client_id is not None) - - @unittest.skipIf( - os.environ.get("RAY_USE_NEW_GCS", False), - "New GCS API doesn't have a Python API yet.") - def test_integration_single_task(self): - # There should be three db clients, the global scheduler, the local - # scheduler, and the plasma manager. - self.assertEqual( - len(self.state.client_table()[self.node_ip_address]), - 2 * NUM_CLUSTER_NODES + 1) - - num_return_vals = [0, 1, 2, 3, 5, 10] - # Insert the object into Redis. - data_size = 0xf1f0 - metadata_size = 0x40 - plasma_client = self.plasma_clients[0] - object_dep, memory_buffer, metadata = create_object( - plasma_client, data_size, metadata_size, seal=True) - - # Sleep before submitting task to local scheduler. - time.sleep(0.1) - # Submit a task to Redis. - task = local_scheduler.Task( - random_driver_id(), random_function_id(), - [local_scheduler.ObjectID(object_dep.binary())], - num_return_vals[0], random_task_id(), 0) - self.local_scheduler_clients[0].submit(task) - time.sleep(0.1) - # There should now be a task in Redis, and it should get assigned to - # the local scheduler - num_retries = 10 - while num_retries > 0: - task_entries = self.state.task_table() - self.assertLessEqual(len(task_entries), 1) - if len(task_entries) == 1: - task_id, task = task_entries.popitem() - task_status = task["State"] - self.assertTrue(task_status in [ - state.TASK_STATUS_WAITING, state.TASK_STATUS_SCHEDULED, - state.TASK_STATUS_QUEUED - ]) - if task_status == state.TASK_STATUS_QUEUED: - break - else: - print(task_status) - print("The task has not been scheduled yet, trying again.") - num_retries -= 1 - time.sleep(1) - - if num_retries <= 0 and task_status != state.TASK_STATUS_QUEUED: - # Failed to submit and schedule a single task -- bail. - self.tearDown() - sys.exit(1) - - def integration_many_tasks_helper(self, timesync=True): - # There should be three db clients, the global scheduler, the local - # scheduler, and the plasma manager. - self.assertEqual( - len(self.state.client_table()[self.node_ip_address]), - 2 * NUM_CLUSTER_NODES + 1) - num_return_vals = [0, 1, 2, 3, 5, 10] - - # Submit a bunch of tasks to Redis. - num_tasks = 1000 - for _ in range(num_tasks): - # Create a new object for each task. - data_size = np.random.randint(1 << 12) - metadata_size = np.random.randint(1 << 9) - plasma_client = self.plasma_clients[0] - object_dep, memory_buffer, metadata = create_object( - plasma_client, data_size, metadata_size, seal=True) - if timesync: - # Give 10ms for object info handler to fire (long enough to - # yield CPU). - time.sleep(0.010) - task = local_scheduler.Task( - random_driver_id(), random_function_id(), - [local_scheduler.ObjectID(object_dep.binary())], - num_return_vals[0], random_task_id(), 0) - self.local_scheduler_clients[0].submit(task) - # Check that there are the correct number of tasks in Redis and that - # they all get assigned to the local scheduler. - num_retries = 20 - num_tasks_done = 0 - while num_retries > 0: - task_entries = self.state.task_table() - self.assertLessEqual(len(task_entries), num_tasks) - # First, check if all tasks made it to Redis. 
- if len(task_entries) == num_tasks: - task_statuses = [ - task_entry["State"] - for task_entry in task_entries.values() - ] - self.assertTrue( - all(status in [ - state.TASK_STATUS_WAITING, state.TASK_STATUS_SCHEDULED, - state.TASK_STATUS_QUEUED - ] for status in task_statuses)) - num_tasks_done = task_statuses.count(state.TASK_STATUS_QUEUED) - num_tasks_scheduled = task_statuses.count( - state.TASK_STATUS_SCHEDULED) - num_tasks_waiting = task_statuses.count( - state.TASK_STATUS_WAITING) - print("tasks in Redis = {}, tasks waiting = {}, " - "tasks scheduled = {}, " - "tasks queued = {}, retries left = {}".format( - len(task_entries), num_tasks_waiting, - num_tasks_scheduled, num_tasks_done, num_retries)) - if all(status == state.TASK_STATUS_QUEUED - for status in task_statuses): - # We're done, so pass. - break - num_retries -= 1 - time.sleep(0.1) - - # Tasks can either be queued or in the global scheduler due to - # spillback. - self.assertEqual(num_tasks_done + num_tasks_waiting, num_tasks) - - @unittest.skipIf( - os.environ.get("RAY_USE_NEW_GCS", False), - "New GCS API doesn't have a Python API yet.") - def test_integration_many_tasks_handler_sync(self): - self.integration_many_tasks_helper(timesync=True) - - @unittest.skipIf( - os.environ.get("RAY_USE_NEW_GCS", False), - "New GCS API doesn't have a Python API yet.") - def test_integration_many_tasks(self): - # More realistic case: should handle out of order object and task - # notifications. - self.integration_many_tasks_helper(timesync=False) - - -if __name__ == "__main__": - if len(sys.argv) > 1: - # Pop the argument so we don't mess with unittest's own argument - # parser. - if sys.argv[-1] == "valgrind": - arg = sys.argv.pop() - USE_VALGRIND = True - print("Using valgrind for tests") - unittest.main(verbosity=2) diff --git a/python/ray/import_thread.py b/python/ray/import_thread.py index 659cdf1ce281e..70dba322370bb 100644 --- a/python/ray/import_thread.py +++ b/python/ray/import_thread.py @@ -88,7 +88,8 @@ def _process_key(self, key): if key.startswith(b"RemoteFunction"): with profiling.profile( "register_remote_function", worker=self.worker): - self.fetch_and_register_remote_function(key) + (self.worker.function_actor_manager. + fetch_and_register_remote_function(key)) elif key.startswith(b"FunctionsToRun"): with profiling.profile( "fetch_and_run_function", worker=self.worker): @@ -103,65 +104,13 @@ def _process_key(self, key): else: raise Exception("This code should be unreachable.") - def fetch_and_register_remote_function(self, key): - """Import a remote function.""" - from ray.worker import FunctionExecutionInfo - (driver_id, function_id_str, function_name, serialized_function, - num_return_vals, module, resources, - max_calls) = self.redis_client.hmget(key, [ - "driver_id", "function_id", "name", "function", "num_return_vals", - "module", "resources", "max_calls" - ]) - function_id = ray.ObjectID(function_id_str) - function_name = utils.decode(function_name) - max_calls = int(max_calls) - module = utils.decode(module) - - # This is a placeholder in case the function can't be unpickled. This - # will be overwritten if the function is successfully registered. 
- def f(): - raise Exception("This function was not imported properly.") - - self.worker.function_execution_info[driver_id][function_id.id()] = ( - FunctionExecutionInfo( - function=f, function_name=function_name, max_calls=max_calls)) - self.worker.num_task_executions[driver_id][function_id.id()] = 0 - - try: - function = pickle.loads(serialized_function) - except Exception: - # If an exception was thrown when the remote function was imported, - # we record the traceback and notify the scheduler of the failure. - traceback_str = utils.format_error_message(traceback.format_exc()) - # Log the error message. - utils.push_error_to_driver( - self.worker, - ray_constants.REGISTER_REMOTE_FUNCTION_PUSH_ERROR, - traceback_str, - driver_id=driver_id, - data={ - "function_id": function_id.id(), - "function_name": function_name - }) - else: - # TODO(rkn): Why is the below line necessary? - function.__module__ = module - self.worker.function_execution_info[driver_id][ - function_id.id()] = (FunctionExecutionInfo( - function=function, - function_name=function_name, - max_calls=max_calls)) - # Add the function to the function table. - self.redis_client.rpush(b"FunctionTable:" + function_id.id(), - self.worker.worker_id) - def fetch_and_execute_function_to_run(self, key): """Run on arbitrary function on the worker.""" (driver_id, serialized_function, run_on_other_drivers) = self.redis_client.hmget( key, ["driver_id", "function", "run_on_other_drivers"]) - if (run_on_other_drivers == "False" + if (utils.decode(run_on_other_drivers) == "False" and self.worker.mode == ray.SCRIPT_MODE and driver_id != self.worker.task_driver_id.id()): return diff --git a/python/ray/internal/internal_api.py b/python/ray/internal/internal_api.py index 062d633ee44bd..7772974319aea 100644 --- a/python/ray/internal/internal_api.py +++ b/python/ray/internal/internal_api.py @@ -2,7 +2,7 @@ from __future__ import division from __future__ import print_function -import ray.local_scheduler +import ray.raylet import ray.worker from ray import profiling @@ -42,7 +42,4 @@ def free(object_ids, local_only=False, worker=None): if len(object_ids) == 0: return - if worker.use_raylet: - worker.local_scheduler_client.free(object_ids, local_only) - else: - raise Exception("Free is not supported in legacy backend.") + worker.local_scheduler_client.free(object_ids, local_only) diff --git a/python/ray/local_scheduler/build/.gitkeep b/python/ray/local_scheduler/build/.gitkeep deleted file mode 100644 index e69de29bb2d1d..0000000000000 diff --git a/python/ray/local_scheduler/local_scheduler_services.py b/python/ray/local_scheduler/local_scheduler_services.py deleted file mode 100644 index f7847ce551b0f..0000000000000 --- a/python/ray/local_scheduler/local_scheduler_services.py +++ /dev/null @@ -1,133 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import multiprocessing -import os -import random -import subprocess -import sys -import time - - -def random_name(): - return str(random.randint(0, 99999999)) - - -def start_local_scheduler(plasma_store_name, - plasma_manager_name=None, - worker_path=None, - plasma_address=None, - node_ip_address="127.0.0.1", - redis_address=None, - use_valgrind=False, - use_profiler=False, - stdout_file=None, - stderr_file=None, - static_resources=None, - num_workers=0): - """Start a local scheduler process. - - Args: - plasma_store_name (str): The name of the plasma store socket to connect - to. 
- plasma_manager_name (str): The name of the plasma manager to connect - to. This does not need to be provided, but if it is, then the Redis - address must be provided as well. - worker_path (str): The path of the worker script to use when the local - scheduler starts up new workers. - plasma_address (str): The address of the plasma manager to connect to. - This is only used by the global scheduler to figure out which - plasma managers are connected to which local schedulers. - node_ip_address (str): The address of the node that this local - scheduler is running on. - redis_address (str): The address of the Redis instance to connect to. - If this is not provided, then the local scheduler will not connect - to Redis. - use_valgrind (bool): True if the local scheduler should be started - inside of valgrind. If this is True, use_profiler must be False. - use_profiler (bool): True if the local scheduler should be started - inside a profiler. If this is True, use_valgrind must be False. - stdout_file: A file handle opened for writing to redirect stdout to. If - no redirection should happen, then this should be None. - stderr_file: A file handle opened for writing to redirect stderr to. If - no redirection should happen, then this should be None. - static_resources: A dictionary specifying the local scheduler's - resource capacities. This maps resource names (strings) to - integers or floats. - num_workers (int): The number of workers that the local scheduler - should start. - - Return: - A tuple of the name of the local scheduler socket and the process ID of - the local scheduler process. - """ - if (plasma_manager_name is None) != (redis_address is None): - raise Exception("If one of the plasma_manager_name and the " - "redis_address is provided, then both must be " - "provided.") - if use_valgrind and use_profiler: - raise Exception("Cannot use valgrind and profiler at the same time.") - local_scheduler_executable = os.path.join( - os.path.dirname(os.path.abspath(__file__)), - "../core/src/local_scheduler/local_scheduler") - local_scheduler_name = "/tmp/scheduler{}".format(random_name()) - command = [ - local_scheduler_executable, "-s", local_scheduler_name, "-p", - plasma_store_name, "-h", node_ip_address, "-n", - str(num_workers) - ] - if plasma_manager_name is not None: - command += ["-m", plasma_manager_name] - if worker_path is not None: - assert plasma_store_name is not None - assert plasma_manager_name is not None - assert redis_address is not None - start_worker_command = ("{} {} " - "--node-ip-address={} " - "--object-store-name={} " - "--object-store-manager-name={} " - "--local-scheduler-name={} " - "--redis-address={}".format( - sys.executable, worker_path, - node_ip_address, plasma_store_name, - plasma_manager_name, local_scheduler_name, - redis_address)) - command += ["-w", start_worker_command] - if redis_address is not None: - command += ["-r", redis_address] - if plasma_address is not None: - command += ["-a", plasma_address] - if static_resources is not None: - resource_argument = "" - for resource_name, resource_quantity in static_resources.items(): - assert (isinstance(resource_quantity, int) - or isinstance(resource_quantity, float)) - resource_argument = ",".join([ - resource_name + "," + str(resource_quantity) - for resource_name, resource_quantity in static_resources.items() - ]) - else: - resource_argument = "CPU,{}".format(multiprocessing.cpu_count()) - command += ["-c", resource_argument] - - if use_valgrind: - pid = subprocess.Popen( - [ - "valgrind", 
"--track-origins=yes", "--leak-check=full", - "--show-leak-kinds=all", "--leak-check-heuristics=stdstring", - "--error-exitcode=1" - ] + command, - stdout=stdout_file, - stderr=stderr_file) - time.sleep(1.0) - elif use_profiler: - pid = subprocess.Popen( - ["valgrind", "--tool=callgrind"] + command, - stdout=stdout_file, - stderr=stderr_file) - time.sleep(1.0) - else: - pid = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) - time.sleep(0.1) - return local_scheduler_name, pid diff --git a/python/ray/local_scheduler/test/test.py b/python/ray/local_scheduler/test/test.py deleted file mode 100644 index b35d609de6e0e..0000000000000 --- a/python/ray/local_scheduler/test/test.py +++ /dev/null @@ -1,206 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import numpy as np -import os -import signal -import sys -import threading -import time -import unittest - -import ray.local_scheduler as local_scheduler -import ray.plasma as plasma -import ray.ray_constants as ray_constants -import pyarrow as pa - -USE_VALGRIND = False - -NIL_WORKER_ID = ray_constants.ID_SIZE * b"\xff" - - -def random_object_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_driver_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_task_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def random_function_id(): - return local_scheduler.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -class TestLocalSchedulerClient(unittest.TestCase): - def setUp(self): - # Start Plasma store. - plasma_store_name, self.p1 = plasma.start_plasma_store() - self.plasma_client = pa.plasma.connect(plasma_store_name, "", 0) - # Start a local scheduler. - scheduler_name, self.p2 = local_scheduler.start_local_scheduler( - plasma_store_name, use_valgrind=USE_VALGRIND) - # Connect to the scheduler. - self.local_scheduler_client = local_scheduler.LocalSchedulerClient( - scheduler_name, NIL_WORKER_ID, False, random_task_id(), False) - - def tearDown(self): - # Check that the processes are still alive. - self.assertEqual(self.p1.poll(), None) - self.assertEqual(self.p2.poll(), None) - - # Kill Plasma. - self.p1.kill() - # Kill the local scheduler. - if USE_VALGRIND: - self.p2.send_signal(signal.SIGTERM) - self.p2.wait() - if self.p2.returncode != 0: - os._exit(-1) - else: - self.p2.kill() - - def test_submit_and_get_task(self): - function_id = random_function_id() - object_ids = [random_object_id() for i in range(256)] - # Create and seal the objects in the object store so that we can - # schedule all of the subsequent tasks. - for object_id in object_ids: - self.plasma_client.create(pa.plasma.ObjectID(object_id.id()), 0) - self.plasma_client.seal(pa.plasma.ObjectID(object_id.id())) - # Define some arguments to use for the tasks. 
- args_list = [[], [{}], [()], 1 * [1], 10 * [1], 100 * [1], 1000 * [1], - 1 * ["a"], 10 * ["a"], 100 * ["a"], 1000 * ["a"], [ - 1, 1.3, 1 << 100, "hi", u"hi", [1, 2] - ], object_ids[:1], object_ids[:2], object_ids[:3], - object_ids[:4], object_ids[:5], object_ids[:10], - object_ids[:100], object_ids[:256], [1, object_ids[0]], [ - object_ids[0], "a" - ], [1, object_ids[0], "a"], [ - object_ids[0], 1, object_ids[1], "a" - ], object_ids[:3] + [1, "hi", 2.3] + object_ids[:5], - object_ids + 100 * ["a"] + object_ids] - - for args in args_list: - for num_return_vals in [0, 1, 2, 3, 5, 10, 100]: - task = local_scheduler.Task(random_driver_id(), function_id, - args, num_return_vals, - random_task_id(), 0) - # Submit a task. - self.local_scheduler_client.submit(task) - # Get the task. - new_task = self.local_scheduler_client.get_task() - self.assertEqual(task.function_id().id(), - new_task.function_id().id()) - retrieved_args = new_task.arguments() - returns = new_task.returns() - self.assertEqual(len(args), len(retrieved_args)) - self.assertEqual(num_return_vals, len(returns)) - for i in range(len(retrieved_args)): - if isinstance(args[i], local_scheduler.ObjectID): - self.assertEqual(args[i].id(), retrieved_args[i].id()) - else: - self.assertEqual(args[i], retrieved_args[i]) - - # Submit all of the tasks. - for args in args_list: - for num_return_vals in [0, 1, 2, 3, 5, 10, 100]: - task = local_scheduler.Task(random_driver_id(), function_id, - args, num_return_vals, - random_task_id(), 0) - self.local_scheduler_client.submit(task) - # Get all of the tasks. - for args in args_list: - for num_return_vals in [0, 1, 2, 3, 5, 10, 100]: - new_task = self.local_scheduler_client.get_task() - - def test_scheduling_when_objects_ready(self): - # Create a task and submit it. - object_id = random_object_id() - task = local_scheduler.Task(random_driver_id(), random_function_id(), - [object_id], 0, random_task_id(), 0) - self.local_scheduler_client.submit(task) - - # Launch a thread to get the task. - def get_task(): - self.local_scheduler_client.get_task() - - t = threading.Thread(target=get_task) - t.start() - # Sleep to give the thread time to call get_task. - time.sleep(0.1) - # Create and seal the object ID in the object store. This should - # trigger a scheduling event. - self.plasma_client.create(pa.plasma.ObjectID(object_id.id()), 0) - self.plasma_client.seal(pa.plasma.ObjectID(object_id.id())) - # Wait until the thread finishes so that we know the task was - # scheduled. - t.join() - - def test_scheduling_when_objects_evicted(self): - # Create a task with two dependencies and submit it. - object_id1 = random_object_id() - object_id2 = random_object_id() - task = local_scheduler.Task(random_driver_id(), random_function_id(), - [object_id1, object_id2], 0, - random_task_id(), 0) - self.local_scheduler_client.submit(task) - - # Launch a thread to get the task. - def get_task(): - self.local_scheduler_client.get_task() - - t = threading.Thread(target=get_task) - t.start() - - # Make one of the dependencies available. - buf = self.plasma_client.create(pa.plasma.ObjectID(object_id1.id()), 1) - self.plasma_client.seal(pa.plasma.ObjectID(object_id1.id())) - # Release the object. - del buf - # Check that the thread is still waiting for a task. - time.sleep(0.1) - self.assertTrue(t.is_alive()) - # Force eviction of the first dependency. - self.plasma_client.evict(plasma.DEFAULT_PLASMA_STORE_MEMORY) - # Check that the thread is still waiting for a task. 
- time.sleep(0.1) - self.assertTrue(t.is_alive()) - # Check that the first object dependency was evicted. - object1 = self.plasma_client.get_buffers( - [pa.plasma.ObjectID(object_id1.id())], timeout_ms=0) - self.assertEqual(object1, [None]) - # Check that the thread is still waiting for a task. - time.sleep(0.1) - self.assertTrue(t.is_alive()) - - # Create the second dependency. - self.plasma_client.create(pa.plasma.ObjectID(object_id2.id()), 1) - self.plasma_client.seal(pa.plasma.ObjectID(object_id2.id())) - # Check that the thread is still waiting for a task. - time.sleep(0.1) - self.assertTrue(t.is_alive()) - - # Create the first dependency again. Both dependencies are now - # available. - self.plasma_client.create(pa.plasma.ObjectID(object_id1.id()), 1) - self.plasma_client.seal(pa.plasma.ObjectID(object_id1.id())) - - # Wait until the thread finishes so that we know the task was - # scheduled. - t.join() - - -if __name__ == "__main__": - if len(sys.argv) > 1: - # Pop the argument so we don't mess with unittest's own argument - # parser. - if sys.argv[-1] == "valgrind": - arg = sys.argv.pop() - USE_VALGRIND = True - print("Using valgrind for tests") - unittest.main(verbosity=2) diff --git a/python/ray/log_monitor.py b/python/ray/log_monitor.py index 13a62a98a322b..2cd6fc40a0f56 100644 --- a/python/ray/log_monitor.py +++ b/python/ray/log_monitor.py @@ -35,11 +35,15 @@ class LogMonitor(object): handle for that file. """ - def __init__(self, redis_ip_address, redis_port, node_ip_address): + def __init__(self, + redis_ip_address, + redis_port, + node_ip_address, + redis_password=None): """Initialize the log monitor object.""" self.node_ip_address = node_ip_address self.redis_client = redis.StrictRedis( - host=redis_ip_address, port=redis_port) + host=redis_ip_address, port=redis_port, password=redis_password) self.log_files = {} self.log_file_handles = {} self.files_to_ignore = set() @@ -130,6 +134,12 @@ def run(self): required=True, type=str, help="The IP address of the node this process is on.") + parser.add_argument( + "--redis-password", + required=False, + type=str, + default=None, + help="the password to use for Redis") parser.add_argument( "--logging-level", required=False, @@ -151,6 +161,9 @@ def run(self): redis_ip_address = get_ip_address(args.redis_address) redis_port = get_port(args.redis_address) - log_monitor = LogMonitor(redis_ip_address, redis_port, - args.node_ip_address) + log_monitor = LogMonitor( + redis_ip_address, + redis_port, + args.node_ip_address, + redis_password=args.redis_password) log_monitor.run() diff --git a/python/ray/memory_monitor.py b/python/ray/memory_monitor.py new file mode 100644 index 0000000000000..a52f98d7077df --- /dev/null +++ b/python/ray/memory_monitor.py @@ -0,0 +1,81 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import logging +import os +import time + +try: + import psutil +except ImportError: + psutil = None + +logger = logging.getLogger(__name__) + + +class RayOutOfMemoryError(Exception): + def __init__(self, msg): + Exception.__init__(self, msg) + + @staticmethod + def get_message(used_gb, total_gb, threshold): + pids = psutil.pids() + proc_stats = [] + for pid in pids: + proc = psutil.Process(pid) + proc_stats.append((proc.memory_info().rss, pid, proc.cmdline())) + proc_str = "PID\tMEM\tCOMMAND" + for rss, pid, cmdline in sorted(proc_stats, reverse=True)[:5]: + proc_str += "\n{}\t{}GB\t{}".format( + pid, round(rss / 1e9, 2), " ".join(cmdline)[:100].strip()) + 
return ("More than {}% of the memory on ".format(int( + 100 * threshold)) + "node {} is used ({} / {} GB). ".format( + os.uname()[1], round(used_gb, 2), round(total_gb, 2)) + + "The top 5 memory consumers are:\n\n{}".format(proc_str) + + "\n\nIn addition, ~{} GB of shared memory is ".format( + round(psutil.virtual_memory().shared / 1e9, 2)) + + "currently being used by the Ray object store. You can set " + "the object store size with the `object_store_memory` " + "parameter when starting Ray, and the max Redis size with " + "`redis_max_memory`.") + + +class MemoryMonitor(object): + """Helper class for raising errors on low memory. + + This presents a much cleaner error message to users than what would happen + if we actually ran out of memory. + """ + + def __init__(self, error_threshold=0.95, check_interval=1): + # Note: it takes ~50us to check the memory usage through psutil, so + # throttle this check at most once a second or so. + self.check_interval = check_interval + self.last_checked = time.time() + self.error_threshold = error_threshold + if not psutil: + logger.warning( + "WARNING: Not monitoring node memory since `psutil` is not " + "installed. Install this with `pip install psutil` " + "(or ray[debug]) to enable debugging of memory-related " + "crashes.") + + def raise_if_low_memory(self): + if not psutil: + return # nothing we can do + + if "RAY_DEBUG_DISABLE_MEMORY_MONITOR" in os.environ: + return # escape hatch, not intended for user use + + if time.time() - self.last_checked > self.check_interval: + self.last_checked = time.time() + total_gb = psutil.virtual_memory().total / 1e9 + used_gb = total_gb - psutil.virtual_memory().available / 1e9 + if used_gb > total_gb * self.error_threshold: + raise RayOutOfMemoryError( + RayOutOfMemoryError.get_message(used_gb, total_gb, + self.error_threshold)) + else: + logger.debug("Memory usage is {} / {}".format( + used_gb, total_gb)) diff --git a/python/ray/monitor.py b/python/ray/monitor.py index e5c2279b72333..a37f75de7cf1b 100644 --- a/python/ray/monitor.py +++ b/python/ray/monitor.py @@ -3,11 +3,9 @@ from __future__ import print_function import argparse -import binascii import logging import os import time -from collections import Counter, defaultdict import traceback import redis @@ -20,27 +18,6 @@ import ray.ray_constants as ray_constants from ray.services import get_ip_address, get_port from ray.utils import binary_to_hex, binary_to_object_id, hex_to_binary -from ray.worker import NIL_ACTOR_ID - -# These variables must be kept in sync with the C codebase. -# common/common.h -NIL_ID = b"\xff" * ray_constants.ID_SIZE - -# common/task.h -TASK_STATUS_LOST = 32 - -# common/redis_module/ray_redis_module.cc -OBJECT_INFO_PREFIX = b"OI:" -OBJECT_LOCATION_PREFIX = b"OL:" -TASK_TABLE_PREFIX = b"TT:" -DB_CLIENT_PREFIX = b"CL:" -DB_CLIENT_TABLE_NAME = b"db_clients" - -# local_scheduler/local_scheduler.h -LOCAL_SCHEDULER_CLIENT_TYPE = b"local_scheduler" - -# plasma/plasma_manager.cc -PLASMA_MANAGER_CLIENT_TYPE = b"plasma_manager" # Set up logging. logger = logging.getLogger(__name__) @@ -55,45 +32,24 @@ class Monitor(object): Attributes: redis: A connection to the Redis server. - use_raylet: A bool indicating whether to use the raylet code path or - not. subscribe_client: A pubsub client for the Redis server. This is used to receive notifications about failed components. - dead_local_schedulers: A set of the local scheduler IDs of all of the - local schedulers that were up at one point and have died since - then. 
- live_plasma_managers: A counter mapping live plasma manager IDs to the - number of heartbeats that have passed since we last heard from that - plasma manager. A plasma manager is live if we received a heartbeat - from it at any point, and if it has not timed out. - dead_plasma_managers: A set of the plasma manager IDs of all the plasma - managers that were up at one point and have died since then. """ - def __init__(self, redis_address, redis_port, autoscaling_config): + def __init__(self, + redis_address, + redis_port, + autoscaling_config, + redis_password=None): # Initialize the Redis clients. self.state = ray.experimental.state.GlobalState() - self.state._initialize_global_state(redis_address, redis_port) - self.use_raylet = self.state.use_raylet + self.state._initialize_global_state( + redis_address, redis_port, redis_password=redis_password) self.redis = redis.StrictRedis( - host=redis_address, port=redis_port, db=0) + host=redis_address, port=redis_port, db=0, password=redis_password) # Setup subscriptions to the primary Redis server and the Redis shards. self.primary_subscribe_client = self.redis.pubsub( ignore_subscribe_messages=True) - if self.use_raylet: - self.shard_subscribe_clients = [] - for redis_client in self.state.redis_clients: - subscribe_client = redis_client.pubsub( - ignore_subscribe_messages=True) - self.shard_subscribe_clients.append(subscribe_client) - else: - # We don't need to subscribe to the shards in legacy Ray. - self.shard_subscribe_clients = [] - # Initialize data structures to keep track of the active database - # clients. - self.dead_local_schedulers = set() - self.live_plasma_managers = Counter() - self.dead_plasma_managers = set() # Keep a mapping from local scheduler client ID to IP address to use # for updating the load metrics. self.local_scheduler_id_to_ip_map = {} @@ -118,7 +74,9 @@ def __init__(self, redis_address, redis_port, autoscaling_config): else: addr_port = addr_port[0].split(b":") self.redis_shard = redis.StrictRedis( - host=addr_port[0], port=addr_port[1]) + host=addr_port[0], + port=addr_port[1], + password=redis_password) try: self.redis_shard.execute_command("HEAD.FLUSH 0") except redis.exceptions.ResponseError as e: @@ -127,367 +85,50 @@ def __init__(self, redis_address, redis_port, autoscaling_config): str(e))) self.issue_gcs_flushes = False - def subscribe(self, channel, primary=True): - """Subscribe to the given channel. + def subscribe(self, channel): + """Subscribe to the given channel on the primary Redis shard. Args: channel (str): The channel to subscribe to. - primary: If True, then we only subscribe to the primary Redis - shard. Otherwise we subscribe to all of the other shards but - not the primary. Raises: Exception: An exception is raised if the subscription fails. """ - if primary: - self.primary_subscribe_client.subscribe(channel) - else: - for subscribe_client in self.shard_subscribe_clients: - subscribe_client.subscribe(channel) - - def cleanup_task_table(self): - """Clean up global state for failed local schedulers. + self.primary_subscribe_client.subscribe(channel) - This marks any tasks that were scheduled on dead local schedulers as - TASK_STATUS_LOST. A local scheduler is deemed dead if it is in - self.dead_local_schedulers. - """ - tasks = self.state.task_table() - num_tasks_updated = 0 - for task_id, task in tasks.items(): - # See if the corresponding local scheduler is alive. 
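
# Illustrative sketch of the updated Monitor constructor above, which now
# threads an optional Redis password through to GlobalState and the primary
# Redis client. Address, port, and password are placeholder values for a
# hypothetical deployment with a reachable Redis server.
from ray.monitor import Monitor

monitor = Monitor(
    "127.0.0.1",                        # redis_address of the primary Redis
    6379,                               # redis_port
    autoscaling_config=None,            # no autoscaler config in this sketch
    redis_password="example-password",  # placeholder; None if unauthenticated
)
monitor.run()
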
- if task["LocalSchedulerID"] not in self.dead_local_schedulers: - continue - - # Remove dummy objects returned by actor tasks from any plasma - # manager. Although the objects may still exist in that object - # store, this deletion makes them effectively unreachable by any - # local scheduler connected to a different store. - # TODO(swang): Actually remove the objects from the object store, - # so that the reconstructed actor can reuse the same object store. - if hex_to_binary(task["TaskSpec"]["ActorID"]) != NIL_ACTOR_ID: - dummy_object_id = task["TaskSpec"]["ReturnObjectIDs"][-1] - obj = self.state.object_table(dummy_object_id) - manager_ids = obj["ManagerIDs"] - if manager_ids is not None: - # The dummy object should exist on at most one plasma - # manager, the manager associated with the local scheduler - # that died. - assert len(manager_ids) <= 1 - # Remove the dummy object from the plasma manager - # associated with the dead local scheduler, if any. - for manager in manager_ids: - ok = self.state._execute_command( - dummy_object_id, "RAY.OBJECT_TABLE_REMOVE", - dummy_object_id.id(), hex_to_binary(manager)) - if ok != b"OK": - logger.warn("Failed to remove object location for " - "dead plasma manager.") - - # If the task is scheduled on a dead local scheduler, mark the - # task as lost. - key = binary_to_object_id(hex_to_binary(task_id)) - ok = self.state._execute_command( - key, "RAY.TASK_TABLE_UPDATE", hex_to_binary(task_id), - ray.experimental.state.TASK_STATUS_LOST, NIL_ID, - task["ExecutionDependenciesString"], task["SpillbackCount"]) - if ok != b"OK": - logger.warn("Failed to update lost task for dead scheduler.") - num_tasks_updated += 1 - - if num_tasks_updated > 0: - logger.warn("Marked {} tasks as lost.".format(num_tasks_updated)) - - def cleanup_object_table(self): - """Clean up global state for failed plasma managers. - - This removes dead plasma managers from any location entries in the - object table. A plasma manager is deemed dead if it is in - self.dead_plasma_managers. - """ - # TODO(swang): Also kill the associated plasma store, since it's no - # longer reachable without a plasma manager. - objects = self.state.object_table() - num_objects_removed = 0 - for object_id, obj in objects.items(): - manager_ids = obj["ManagerIDs"] - if manager_ids is None: - continue - for manager in manager_ids: - if manager in self.dead_plasma_managers: - # If the object was on a dead plasma manager, remove that - # location entry. - ok = self.state._execute_command( - object_id, "RAY.OBJECT_TABLE_REMOVE", object_id.id(), - hex_to_binary(manager)) - if ok != b"OK": - logger.warn("Failed to remove object location for " - "dead plasma manager.") - num_objects_removed += 1 - if num_objects_removed > 0: - logger.warn("Marked {} objects as lost." - .format(num_objects_removed)) - - def scan_db_client_table(self): - """Scan the database client table for dead clients. - - After subscribing to the client table, it's necessary to call this - before reading any messages from the subscription channel. This ensures - that we do not miss any notifications for deleted clients that occurred - before we subscribed. - """ - # Exit if we are using the raylet code path because client_table is - # implemented differently. TODO(rkn): Fix this. 
- if self.use_raylet: - return - - clients = self.state.client_table() - for node_ip_address, node_clients in clients.items(): - for client in node_clients: - db_client_id = client["DBClientID"] - client_type = client["ClientType"] - if client["Deleted"]: - if client_type == LOCAL_SCHEDULER_CLIENT_TYPE: - self.dead_local_schedulers.add(db_client_id) - elif client_type == PLASMA_MANAGER_CLIENT_TYPE: - self.dead_plasma_managers.add(db_client_id) - - def db_client_notification_handler(self, unused_channel, data): - """Handle a notification from the db_client table from Redis. - - This handler processes notifications from the db_client table. - Notifications should be parsed using the SubscribeToDBClientTableReply - flatbuffer. Deletions are processed, insertions are ignored. Cleanup of - the associated state in the state tables should be handled by the - caller. - """ - notification_object = (ray.gcs_utils.SubscribeToDBClientTableReply. - GetRootAsSubscribeToDBClientTableReply(data, 0)) - db_client_id = binary_to_hex(notification_object.DbClientId()) - client_type = notification_object.ClientType() - is_insertion = notification_object.IsInsertion() - - # If the update was an insertion, we ignore it. - if is_insertion: - return - - # If the update was a deletion, add them to our accounting for dead - # local schedulers and plasma managers. - logger.warn("Removed {}, client ID {}".format(client_type, - db_client_id)) - if client_type == LOCAL_SCHEDULER_CLIENT_TYPE: - if db_client_id not in self.dead_local_schedulers: - self.dead_local_schedulers.add(db_client_id) - elif client_type == PLASMA_MANAGER_CLIENT_TYPE: - if db_client_id not in self.dead_plasma_managers: - self.dead_plasma_managers.add(db_client_id) - # Stop tracking this plasma manager's heartbeats, since it's - # already dead. - del self.live_plasma_managers[db_client_id] - - def local_scheduler_info_handler(self, unused_channel, data): - """Handle a local scheduler heartbeat from Redis.""" - - message = (ray.gcs_utils.LocalSchedulerInfoMessage. - GetRootAsLocalSchedulerInfoMessage(data, 0)) - num_resources = message.DynamicResourcesLength() - static_resources = {} - dynamic_resources = {} - for i in range(num_resources): - dyn = message.DynamicResources(i) - static = message.StaticResources(i) - dynamic_resources[dyn.Key().decode("utf-8")] = dyn.Value() - static_resources[static.Key().decode("utf-8")] = static.Value() - - # Update the load metrics for this local scheduler. 
- client_id = binascii.hexlify(message.DbClientId()).decode("utf-8") - ip = self.local_scheduler_id_to_ip_map.get(client_id) - if ip: - self.load_metrics.update(ip, static_resources, dynamic_resources) - else: - logger.warning( - "Warning: could not find ip for client {} in {}.".format( - client_id, self.local_scheduler_id_to_ip_map)) - - def xray_heartbeat_handler(self, unused_channel, data): - """Handle an xray heartbeat message from Redis.""" + def xray_heartbeat_batch_handler(self, unused_channel, data): + """Handle an xray heartbeat batch message from Redis.""" gcs_entries = ray.gcs_utils.GcsTableEntry.GetRootAsGcsTableEntry( data, 0) heartbeat_data = gcs_entries.Entries(0) - message = ray.gcs_utils.HeartbeatTableData.GetRootAsHeartbeatTableData( - heartbeat_data, 0) - num_resources = message.ResourcesAvailableLabelLength() - static_resources = {} - dynamic_resources = {} - for i in range(num_resources): - dyn = message.ResourcesAvailableLabel(i) - static = message.ResourcesTotalLabel(i) - dynamic_resources[dyn] = message.ResourcesAvailableCapacity(i) - static_resources[static] = message.ResourcesTotalCapacity(i) - - # Update the load metrics for this local scheduler. - client_id = ray.utils.binary_to_hex(message.ClientId()) - ip = self.local_scheduler_id_to_ip_map.get(client_id) - if ip: - self.load_metrics.update(ip, static_resources, dynamic_resources) - else: - print("Warning: could not find ip for client {} in {}.".format( - client_id, self.local_scheduler_id_to_ip_map)) - - def plasma_manager_heartbeat_handler(self, unused_channel, data): - """Handle a plasma manager heartbeat from Redis. - - This resets the number of heartbeats that we've missed from this plasma - manager. - """ - # The first ray_constants.ID_SIZE characters are the client ID. - db_client_id = data[:ray_constants.ID_SIZE] - # Reset the number of heartbeats that we've missed from this plasma - # manager. - self.live_plasma_managers[db_client_id] = 0 - - def _entries_for_driver_in_shard(self, driver_id, redis_shard_index): - """Collect IDs of control-state entries for a driver from a shard. - - Args: - driver_id: The ID of the driver. - redis_shard_index: The index of the Redis shard to query. - - Returns: - Lists of IDs: (returned_object_ids, task_ids, put_objects). The - first two are relevant to the driver and are safe to delete. - The last contains all "put" objects in this redis shard; each - element is an (object_id, corresponding task_id) pair. - """ - # TODO(zongheng): consider adding save & restore functionalities. - redis = self.state.redis_clients[redis_shard_index] - task_table_infos = {} # task id -> TaskInfo messages - - # Scan the task table & filter to get the list of tasks belong to this - # driver. Use a cursor in order not to block the redis shards. - for key in redis.scan_iter(match=TASK_TABLE_PREFIX + b"*"): - entry = redis.hgetall(key) - task_info = ray.gcs_utils.TaskInfo.GetRootAsTaskInfo( - entry[b"TaskSpec"], 0) - if driver_id != task_info.DriverId(): - # Ignore tasks that aren't from this driver. - continue - task_table_infos[task_info.TaskId()] = task_info - - # Get the list of objects returned by these tasks. Note these might - # not belong to this redis shard. - returned_object_ids = [] - for task_info in task_table_infos.values(): - returned_object_ids.extend([ - task_info.Returns(i) for i in range(task_info.ReturnsLength()) - ]) - - # Also record all the ray.put()'d objects. 
- put_objects = [] - for key in redis.scan_iter(match=OBJECT_INFO_PREFIX + b"*"): - entry = redis.hgetall(key) - if entry[b"is_put"] == "0": - continue - object_id = key.split(OBJECT_INFO_PREFIX)[1] - task_id = entry[b"task"] - put_objects.append((object_id, task_id)) - - return returned_object_ids, task_table_infos.keys(), put_objects - - def _clean_up_entries_from_shard(self, object_ids, task_ids, shard_index): - redis = self.state.redis_clients[shard_index] - # Clean up (in the future, save) entries for non-empty objects. - object_ids_locs = set() - object_ids_infos = set() - for object_id in object_ids: - # OL. - obj_loc = redis.zrange(OBJECT_LOCATION_PREFIX + object_id, 0, -1) - if obj_loc: - object_ids_locs.add(object_id) - # OI. - obj_info = redis.hgetall(OBJECT_INFO_PREFIX + object_id) - if obj_info: - object_ids_infos.add(object_id) - - # Form the redis keys to delete. - keys = [TASK_TABLE_PREFIX + k for k in task_ids] - keys.extend([OBJECT_LOCATION_PREFIX + k for k in object_ids_locs]) - keys.extend([OBJECT_INFO_PREFIX + k for k in object_ids_infos]) - - if not keys: - return - # Remove with best effort. - num_deleted = redis.delete(*keys) - logger.info( - "Removed {} dead redis entries of the driver from redis shard {}.". - format(num_deleted, shard_index)) - if num_deleted != len(keys): - logger.warning( - "Failed to remove {} relevant redis entries" - " from redis shard {}.".format(len(keys) - num_deleted)) - - def _clean_up_entries_for_driver(self, driver_id): - """Remove this driver's object/task entries from all redis shards. - - Specifically, removes control-state entries of: - * all objects (OI and OL entries) created by `ray.put()` from the - driver - * all tasks belonging to the driver. - """ - # TODO(zongheng): handle function_table, client_table, log_files -- - # these are in the metadata redis server, not in the shards. - driver_object_ids = [] - driver_task_ids = [] - all_put_objects = [] - - # Collect relevant ids. - # TODO(zongheng): consider parallelizing this loop. - for shard_index in range(len(self.state.redis_clients)): - returned_object_ids, task_ids, put_objects = \ - self._entries_for_driver_in_shard(driver_id, shard_index) - driver_object_ids.extend(returned_object_ids) - driver_task_ids.extend(task_ids) - all_put_objects.extend(put_objects) - - # For the put objects, keep those from relevant tasks. - driver_task_ids_set = set(driver_task_ids) - for object_id, task_id in all_put_objects: - if task_id in driver_task_ids_set: - driver_object_ids.append(object_id) - - # Partition IDs and distribute to shards. - object_ids_per_shard = defaultdict(list) - task_ids_per_shard = defaultdict(list) - - def ToShardIndex(index): - return binary_to_object_id(index).redis_shard_hash() % len( - self.state.redis_clients) - - for object_id in driver_object_ids: - object_ids_per_shard[ToShardIndex(object_id)].append(object_id) - for task_id in driver_task_ids: - task_ids_per_shard[ToShardIndex(task_id)].append(task_id) - - # TODO(zongheng): consider parallelizing this loop. - for shard_index in range(len(self.state.redis_clients)): - self._clean_up_entries_from_shard( - object_ids_per_shard[shard_index], - task_ids_per_shard[shard_index], shard_index) - - def driver_removed_handler(self, unused_channel, data): - """Handle a notification that a driver has been removed. - This releases any GPU resources that were reserved for that driver in - Redis. 
- """ - message = ray.gcs_utils.DriverTableMessage.GetRootAsDriverTableMessage( - data, 0) - driver_id = message.DriverId() - logger.info("Driver {} has been removed.".format( - binary_to_hex(driver_id))) - - self._clean_up_entries_for_driver(driver_id) + message = (ray.gcs_utils.HeartbeatBatchTableData. + GetRootAsHeartbeatBatchTableData(heartbeat_data, 0)) + + for j in range(message.BatchLength()): + heartbeat_message = message.Batch(j) + + num_resources = heartbeat_message.ResourcesAvailableLabelLength() + static_resources = {} + dynamic_resources = {} + for i in range(num_resources): + dyn = heartbeat_message.ResourcesAvailableLabel(i) + static = heartbeat_message.ResourcesTotalLabel(i) + dynamic_resources[dyn] = ( + heartbeat_message.ResourcesAvailableCapacity(i)) + static_resources[static] = ( + heartbeat_message.ResourcesTotalCapacity(i)) + + # Update the load metrics for this local scheduler. + client_id = ray.utils.binary_to_hex(heartbeat_message.ClientId()) + ip = self.local_scheduler_id_to_ip_map.get(client_id) + if ip: + self.load_metrics.update(ip, static_resources, + dynamic_resources) + else: + print("Warning: could not find ip for client {} in {}.".format( + client_id, self.local_scheduler_id_to_ip_map)) def _xray_clean_up_entries_for_driver(self, driver_id): """Remove this driver's object/task entries from redis. @@ -507,10 +148,8 @@ def _xray_clean_up_entries_for_driver(self, driver_id): task_table_objects = self.state.task_table() driver_id_hex = binary_to_hex(driver_id) driver_task_id_bins = set() - for task_id_hex in task_table_objects: - if len(task_table_objects[task_id_hex]) == 0: - continue - task_table_object = task_table_objects[task_id_hex][0]["TaskSpec"] + for task_id_hex, task_info in task_table_objects.items(): + task_table_object = task_info["TaskSpec"] task_driver_id_hex = task_table_object["DriverID"] if driver_id_hex != task_driver_id_hex: # Ignore tasks that aren't from this driver. @@ -520,9 +159,8 @@ def _xray_clean_up_entries_for_driver(self, driver_id): # Get objects associated with the driver. object_table_objects = self.state.object_table() driver_object_id_bins = set() - for object_id, object_table_object in object_table_objects.items(): - assert len(object_table_object) > 0 - task_id_bin = ray.local_scheduler.compute_task_id(object_id).id() + for object_id, _ in object_table_objects.items(): + task_id_bin = ray.raylet.compute_task_id(object_id).id() if task_id_bin in driver_task_id_bins: driver_object_id_bins.add(object_id.id()) @@ -580,8 +218,7 @@ def process_messages(self, max_messages=10000): max_messages: The maximum number of messages to process before returning. """ - subscribe_clients = ( - [self.primary_subscribe_client] + self.shard_subscribe_clients) + subscribe_clients = [self.primary_subscribe_client] for subscribe_client in subscribe_clients: for _ in range(max_messages): message = subscribe_client.get_message() @@ -595,22 +232,9 @@ def process_messages(self, max_messages=10000): # Determine the appropriate message handler. message_handler = None - if channel == ray.gcs_utils.PLASMA_MANAGER_HEARTBEAT_CHANNEL: - # The message was a heartbeat from a plasma manager. - message_handler = self.plasma_manager_heartbeat_handler - elif channel == ray.gcs_utils.LOCAL_SCHEDULER_INFO_CHANNEL: - # The message was a heartbeat from a local scheduler - message_handler = self.local_scheduler_info_handler - elif channel == DB_CLIENT_TABLE_NAME: - # The message was a notification from the db_client table. 
- message_handler = self.db_client_notification_handler - elif channel == ray.gcs_utils.DRIVER_DEATH_CHANNEL: - # The message was a notification that a driver was removed. - logger.info("message-handler: driver_removed_handler") - message_handler = self.driver_removed_handler - elif channel == ray.gcs_utils.XRAY_HEARTBEAT_CHANNEL: + if channel == ray.gcs_utils.XRAY_HEARTBEAT_BATCH_CHANNEL: # Similar functionality as local scheduler info channel - message_handler = self.xray_heartbeat_handler + message_handler = self.xray_heartbeat_batch_handler elif channel == ray.gcs_utils.XRAY_DRIVER_CHANNEL: # Handles driver death. message_handler = self.xray_driver_removed_handler @@ -622,10 +246,7 @@ def process_messages(self, max_messages=10000): message_handler(channel, data) def update_local_scheduler_map(self): - if self.use_raylet: - local_schedulers = self.state.client_table() - else: - local_schedulers = self.state.local_schedulers() + local_schedulers = self.state.client_table() self.local_scheduler_id_to_ip_map = {} for local_scheduler_info in local_schedulers: client_id = local_scheduler_info.get("DBClientID") or \ @@ -673,33 +294,11 @@ def run(self): clients and cleaning up state accordingly. """ # Initialize the subscription channel. - self.subscribe(DB_CLIENT_TABLE_NAME) - self.subscribe(ray.gcs_utils.LOCAL_SCHEDULER_INFO_CHANNEL) - self.subscribe(ray.gcs_utils.PLASMA_MANAGER_HEARTBEAT_CHANNEL) - self.subscribe(ray.gcs_utils.DRIVER_DEATH_CHANNEL) - self.subscribe(ray.gcs_utils.XRAY_HEARTBEAT_CHANNEL, primary=False) + self.subscribe(ray.gcs_utils.XRAY_HEARTBEAT_BATCH_CHANNEL) self.subscribe(ray.gcs_utils.XRAY_DRIVER_CHANNEL) - # Scan the database table for dead database clients. NOTE: This must be - # called before reading any messages from the subscription channel. - # This ensures that we start in a consistent state, since we may have - # missed notifications that were sent before we connected to the - # subscription channel. - self.scan_db_client_table() - # If there were any dead clients at startup, clean up the associated - # state in the state tables. - if len(self.dead_local_schedulers) > 0: - self.cleanup_task_table() - if len(self.dead_plasma_managers) > 0: - self.cleanup_object_table() - - num_plasma_managers = len(self.live_plasma_managers) + len( - self.dead_plasma_managers) - - logger.debug("{} dead local schedulers, {} plasma managers total, {} " - "dead plasma managers".format( - len(self.dead_local_schedulers), num_plasma_managers, - len(self.dead_plasma_managers))) + # TODO(rkn): If there were any dead clients at startup, we should clean + # up the associated state in the state tables. # Handle messages from the subscription channels. while True: @@ -713,43 +312,9 @@ def run(self): self._maybe_flush_gcs() - # Record how many dead local schedulers and plasma managers we had - # at the beginning of this round. - num_dead_local_schedulers = len(self.dead_local_schedulers) - num_dead_plasma_managers = len(self.dead_plasma_managers) - # Process a round of messages. self.process_messages() - # If any new local schedulers or plasma managers were marked as - # dead in this round, clean up the associated state. - if len(self.dead_local_schedulers) > num_dead_local_schedulers: - self.cleanup_task_table() - if len(self.dead_plasma_managers) > num_dead_plasma_managers: - self.cleanup_object_table() - - # Handle plasma managers that timed out during this round. 
- plasma_manager_ids = list(self.live_plasma_managers.keys()) - for plasma_manager_id in plasma_manager_ids: - if ((self.live_plasma_managers[plasma_manager_id]) >= - ray._config.num_heartbeats_timeout()): - logger.warn("Timed out {}" - .format(PLASMA_MANAGER_CLIENT_TYPE)) - # Remove the plasma manager from the managers whose - # heartbeats we're tracking. - del self.live_plasma_managers[plasma_manager_id] - # Remove the plasma manager from the db_client table. The - # corresponding state in the object table will be cleaned - # up once we receive the notification for this db_client - # deletion. - self.redis.execute_command("RAY.DISCONNECT", - plasma_manager_id) - - # Increment the number of heartbeats that we've missed from each - # plasma manager. - for plasma_manager_id in self.live_plasma_managers: - self.live_plasma_managers[plasma_manager_id] += 1 - # Wait for a heartbeat interval before processing the next round of # messages. time.sleep(ray._config.heartbeat_timeout_milliseconds() * 1e-3) @@ -773,6 +338,12 @@ def run(self): required=False, type=str, help="the path to the autoscaling config file") + parser.add_argument( + "--redis-password", + required=False, + type=str, + default=None, + help="the password to use for Redis") parser.add_argument( "--logging-level", required=False, @@ -798,7 +369,11 @@ def run(self): else: autoscaling_config = None - monitor = Monitor(redis_ip_address, redis_port, autoscaling_config) + monitor = Monitor( + redis_ip_address, + redis_port, + autoscaling_config, + redis_password=args.redis_password) try: monitor.run() @@ -810,6 +385,5 @@ def run(self): message = "The monitor failed with the following error:\n{}".format( traceback_str) ray.utils.push_error_to_driver_through_redis( - redis_client, monitor.use_raylet, ray_constants.MONITOR_DIED_ERROR, - message) + redis_client, ray_constants.MONITOR_DIED_ERROR, message) raise e diff --git a/python/ray/plasma/__init__.py b/python/ray/plasma/__init__.py index 1ecd0c2af2dcb..6c6c18b7c555f 100644 --- a/python/ray/plasma/__init__.py +++ b/python/ray/plasma/__init__.py @@ -2,9 +2,6 @@ from __future__ import division from __future__ import print_function -from ray.plasma.plasma import (start_plasma_store, start_plasma_manager, - DEFAULT_PLASMA_STORE_MEMORY) +from ray.plasma.plasma import start_plasma_store, DEFAULT_PLASMA_STORE_MEMORY -__all__ = [ - "start_plasma_store", "start_plasma_manager", "DEFAULT_PLASMA_STORE_MEMORY" -] +__all__ = ["start_plasma_store", "DEFAULT_PLASMA_STORE_MEMORY"] diff --git a/python/ray/plasma/plasma.py b/python/ray/plasma/plasma.py index 60870c2b20210..53b2434260c86 100644 --- a/python/ray/plasma/plasma.py +++ b/python/ray/plasma/plasma.py @@ -3,31 +3,27 @@ from __future__ import print_function import os -import random import subprocess import sys import time -__all__ = [ - "start_plasma_store", "start_plasma_manager", "DEFAULT_PLASMA_STORE_MEMORY" -] +from ray.tempfile_services import get_object_store_socket_name + +__all__ = ["start_plasma_store", "DEFAULT_PLASMA_STORE_MEMORY"] PLASMA_WAIT_TIMEOUT = 2**30 DEFAULT_PLASMA_STORE_MEMORY = 10**9 -def random_name(): - return str(random.randint(0, 99999999)) - - def start_plasma_store(plasma_store_memory=DEFAULT_PLASMA_STORE_MEMORY, use_valgrind=False, use_profiler=False, stdout_file=None, stderr_file=None, plasma_directory=None, - huge_pages=False): + huge_pages=False, + socket_name=None): """Start a plasma store process. Args: @@ -43,6 +39,8 @@ def start_plasma_store(plasma_store_memory=DEFAULT_PLASMA_STORE_MEMORY, be created. 
huge_pages: a boolean flag indicating whether to start the Object Store with hugetlbfs support. Requires plasma_directory. + socket_name (str): If provided, it will specify the socket + name used by the plasma store. Return: A tuple of the name of the plasma store socket and the process ID of @@ -66,7 +64,7 @@ def start_plasma_store(plasma_store_memory=DEFAULT_PLASMA_STORE_MEMORY, plasma_store_executable = os.path.join( os.path.abspath(os.path.dirname(__file__)), "../core/src/plasma/plasma_store_server") - plasma_store_name = "/tmp/plasma_store{}".format(random_name()) + plasma_store_name = socket_name or get_object_store_socket_name() command = [ plasma_store_executable, "-s", plasma_store_name, "-m", str(plasma_store_memory) @@ -95,98 +93,3 @@ def start_plasma_store(plasma_store_memory=DEFAULT_PLASMA_STORE_MEMORY, pid = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) time.sleep(0.1) return plasma_store_name, pid - - -def new_port(): - return random.randint(10000, 65535) - - -def start_plasma_manager(store_name, - redis_address, - node_ip_address="127.0.0.1", - plasma_manager_port=None, - num_retries=20, - use_valgrind=False, - run_profiler=False, - stdout_file=None, - stderr_file=None): - """Start a plasma manager and return the ports it listens on. - - Args: - store_name (str): The name of the plasma store socket. - redis_address (str): The address of the Redis server. - node_ip_address (str): The IP address of the node. - plasma_manager_port (int): The port to use for the plasma manager. If - this is not provided, a port will be generated at random. - use_valgrind (bool): True if the Plasma manager should be started - inside of valgrind and False otherwise. - stdout_file: A file handle opened for writing to redirect stdout to. If - no redirection should happen, then this should be None. - stderr_file: A file handle opened for writing to redirect stderr to. If - no redirection should happen, then this should be None. - - Returns: - A tuple of the Plasma manager socket name, the process ID of the - Plasma manager process, and the port that the manager is - listening on. - - Raises: - Exception: An exception is raised if the manager could not be started. - """ - plasma_manager_executable = os.path.join( - os.path.abspath(os.path.dirname(__file__)), - "../core/src/plasma/plasma_manager") - plasma_manager_name = "/tmp/plasma_manager{}".format(random_name()) - if plasma_manager_port is not None: - if num_retries != 1: - raise Exception("num_retries must be 1 if port is specified.") - else: - plasma_manager_port = new_port() - process = None - counter = 0 - while counter < num_retries: - if counter > 0: - print("Plasma manager failed to start, retrying now.") - command = [ - plasma_manager_executable, - "-s", - store_name, - "-m", - plasma_manager_name, - "-h", - node_ip_address, - "-p", - str(plasma_manager_port), - "-r", - redis_address, - ] - if use_valgrind: - process = subprocess.Popen( - [ - "valgrind", "--track-origins=yes", "--leak-check=full", - "--show-leak-kinds=all", "--error-exitcode=1" - ] + command, - stdout=stdout_file, - stderr=stderr_file) - elif run_profiler: - process = subprocess.Popen( - (["valgrind", "--tool=callgrind"] + command), - stdout=stdout_file, - stderr=stderr_file) - else: - process = subprocess.Popen( - command, stdout=stdout_file, stderr=stderr_file) - # This sleep is critical. If the plasma_manager fails to start because - # the port is already in use, then we need it to fail within 0.1 - # seconds. 
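
# Illustrative sketch of the updated start_plasma_store() above: callers can
# now pin the store to an explicit socket path via socket_name instead of the
# generated default. The socket path is an arbitrary example, and this assumes
# an installed Ray build that ships the plasma_store_server binary.
from ray.plasma import start_plasma_store

store_socket_name, store_process = start_plasma_store(
    plasma_store_memory=10**9,
    socket_name="/tmp/example_plasma_socket",  # placeholder path
)
print("plasma store listening on", store_socket_name)
store_process.kill()  # start_plasma_store returns a subprocess.Popen handle
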
- if use_valgrind: - time.sleep(1) - else: - time.sleep(0.1) - # See if the process has terminated - if process.poll() is None: - return plasma_manager_name, process, plasma_manager_port - # Generate a new port and try again. - plasma_manager_port = new_port() - counter += 1 - raise Exception("Couldn't start plasma manager.") diff --git a/python/ray/plasma/test/test.py b/python/ray/plasma/test/test.py deleted file mode 100644 index a67f2d255e3ac..0000000000000 --- a/python/ray/plasma/test/test.py +++ /dev/null @@ -1,559 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import numpy as np -from numpy.testing import assert_equal -import os -import random -import signal -import subprocess -import sys -import threading -import time -import unittest - -# The ray import must come before the pyarrow import because ray modifies the -# python path so that the right version of pyarrow is found. -import ray -from ray.plasma.utils import (random_object_id, create_object_with_id, - create_object) -import ray.ray_constants as ray_constants -from ray import services -import pyarrow as pa -import pyarrow.plasma as plasma - -USE_VALGRIND = False -PLASMA_STORE_MEMORY = 1000000000 - - -def random_name(): - return str(random.randint(0, 99999999)) - - -def assert_get_object_equal(unit_test, - client1, - client2, - object_id, - memory_buffer=None, - metadata=None): - client1_buff = client1.get_buffers([object_id])[0] - client2_buff = client2.get_buffers([object_id])[0] - client1_metadata = client1.get_metadata([object_id])[0] - client2_metadata = client2.get_metadata([object_id])[0] - unit_test.assertEqual(len(client1_buff), len(client2_buff)) - unit_test.assertEqual(len(client1_metadata), len(client2_metadata)) - # Check that the buffers from the two clients are the same. - assert_equal( - np.frombuffer(client1_buff, dtype="uint8"), - np.frombuffer(client2_buff, dtype="uint8")) - # Check that the metadata buffers from the two clients are the same. - assert_equal( - np.frombuffer(client1_metadata, dtype="uint8"), - np.frombuffer(client2_metadata, dtype="uint8")) - # If a reference buffer was provided, check that it is the same as well. - if memory_buffer is not None: - assert_equal( - np.frombuffer(memory_buffer, dtype="uint8"), - np.frombuffer(client1_buff, dtype="uint8")) - # If reference metadata was provided, check that it is the same as well. - if metadata is not None: - assert_equal( - np.frombuffer(metadata, dtype="uint8"), - np.frombuffer(client1_metadata, dtype="uint8")) - - -DEFAULT_PLASMA_STORE_MEMORY = 10**9 - - -def start_plasma_store(plasma_store_memory=DEFAULT_PLASMA_STORE_MEMORY, - use_valgrind=False, - use_profiler=False, - stdout_file=None, - stderr_file=None): - """Start a plasma store process. - Args: - use_valgrind (bool): True if the plasma store should be started inside - of valgrind. If this is True, use_profiler must be False. - use_profiler (bool): True if the plasma store should be started inside - a profiler. If this is True, use_valgrind must be False. - stdout_file: A file handle opened for writing to redirect stdout to. If - no redirection should happen, then this should be None. - stderr_file: A file handle opened for writing to redirect stderr to. If - no redirection should happen, then this should be None. - Return: - A tuple of the name of the plasma store socket and the process ID of - the plasma store process. 
- """ - if use_valgrind and use_profiler: - raise Exception("Cannot use valgrind and profiler at the same time.") - plasma_store_executable = os.path.join(pa.__path__[0], - "plasma_store_server") - plasma_store_name = "/tmp/plasma_store{}".format(random_name()) - command = [ - plasma_store_executable, "-s", plasma_store_name, "-m", - str(plasma_store_memory) - ] - if use_valgrind: - pid = subprocess.Popen( - [ - "valgrind", "--track-origins=yes", "--leak-check=full", - "--show-leak-kinds=all", "--leak-check-heuristics=stdstring", - "--error-exitcode=1" - ] + command, - stdout=stdout_file, - stderr=stderr_file) - time.sleep(1.0) - elif use_profiler: - pid = subprocess.Popen( - ["valgrind", "--tool=callgrind"] + command, - stdout=stdout_file, - stderr=stderr_file) - time.sleep(1.0) - else: - pid = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) - time.sleep(0.1) - return plasma_store_name, pid - - -# Plasma client tests were moved into arrow - - -class TestPlasmaManager(unittest.TestCase): - def setUp(self): - # Start two PlasmaStores. - store_name1, self.p2 = start_plasma_store(use_valgrind=USE_VALGRIND) - store_name2, self.p3 = start_plasma_store(use_valgrind=USE_VALGRIND) - # Start a Redis server. - redis_address, _ = services.start_redis("127.0.0.1") - # Start two PlasmaManagers. - manager_name1, self.p4, self.port1 = ray.plasma.start_plasma_manager( - store_name1, redis_address, use_valgrind=USE_VALGRIND) - manager_name2, self.p5, self.port2 = ray.plasma.start_plasma_manager( - store_name2, redis_address, use_valgrind=USE_VALGRIND) - # Connect two PlasmaClients. - self.client1 = plasma.connect(store_name1, manager_name1, 64) - self.client2 = plasma.connect(store_name2, manager_name2, 64) - - # Store the processes that will be explicitly killed during tearDown so - # that a test case can remove ones that will be killed during the test. - # NOTE: If this specific order is changed, valgrind will fail. - self.processes_to_kill = [self.p4, self.p5, self.p2, self.p3] - - def tearDown(self): - # Check that the processes are still alive. - for process in self.processes_to_kill: - self.assertEqual(process.poll(), None) - - # Kill the Plasma store and Plasma manager processes. - if USE_VALGRIND: - # Give processes opportunity to finish work. - time.sleep(1) - for process in self.processes_to_kill: - process.send_signal(signal.SIGTERM) - process.wait() - if process.returncode != 0: - print("aborting due to valgrind error") - os._exit(-1) - else: - for process in self.processes_to_kill: - process.kill() - - # Clean up the Redis server. - services.cleanup() - - def test_fetch(self): - for _ in range(10): - # Create an object. - object_id1, memory_buffer1, metadata1 = create_object( - self.client1, 2000, 2000) - self.client1.fetch([object_id1]) - self.assertEqual(self.client1.contains(object_id1), True) - self.assertEqual(self.client2.contains(object_id1), False) - # Fetch the object from the other plasma manager. - # TODO(rkn): Right now we must wait for the object table to be - # updated. - while not self.client2.contains(object_id1): - self.client2.fetch([object_id1]) - # Compare the two buffers. - assert_get_object_equal( - self, - self.client1, - self.client2, - object_id1, - memory_buffer=memory_buffer1, - metadata=metadata1) - - # Test that we can call fetch on object IDs that don't exist yet. 
- object_id2 = random_object_id() - self.client1.fetch([object_id2]) - self.assertEqual(self.client1.contains(object_id2), False) - memory_buffer2, metadata2 = create_object_with_id( - self.client2, object_id2, 2000, 2000) - # # Check that the object has been fetched. - # self.assertEqual(self.client1.contains(object_id2), True) - # Compare the two buffers. - # assert_get_object_equal(self, self.client1, self.client2, object_id2, - # memory_buffer=memory_buffer2, - # metadata=metadata2) - - # Test calling the same fetch request a bunch of times. - object_id3 = random_object_id() - self.assertEqual(self.client1.contains(object_id3), False) - self.assertEqual(self.client2.contains(object_id3), False) - for _ in range(10): - self.client1.fetch([object_id3]) - self.client2.fetch([object_id3]) - memory_buffer3, metadata3 = create_object_with_id( - self.client1, object_id3, 2000, 2000) - for _ in range(10): - self.client1.fetch([object_id3]) - self.client2.fetch([object_id3]) - # TODO(rkn): Right now we must wait for the object table to be updated. - while not self.client2.contains(object_id3): - self.client2.fetch([object_id3]) - assert_get_object_equal( - self, - self.client1, - self.client2, - object_id3, - memory_buffer=memory_buffer3, - metadata=metadata3) - - def test_fetch_multiple(self): - for _ in range(20): - # Create two objects and a third fake one that doesn't exist. - object_id1, memory_buffer1, metadata1 = create_object( - self.client1, 2000, 2000) - missing_object_id = random_object_id() - object_id2, memory_buffer2, metadata2 = create_object( - self.client1, 2000, 2000) - object_ids = [object_id1, missing_object_id, object_id2] - # Fetch the objects from the other plasma store. The second object - # ID should timeout since it does not exist. - # TODO(rkn): Right now we must wait for the object table to be - # updated. - while ((not self.client2.contains(object_id1)) - or (not self.client2.contains(object_id2))): - self.client2.fetch(object_ids) - # Compare the buffers of the objects that do exist. - assert_get_object_equal( - self, - self.client1, - self.client2, - object_id1, - memory_buffer=memory_buffer1, - metadata=metadata1) - assert_get_object_equal( - self, - self.client1, - self.client2, - object_id2, - memory_buffer=memory_buffer2, - metadata=metadata2) - # Fetch in the other direction. The fake object still does not - # exist. - self.client1.fetch(object_ids) - assert_get_object_equal( - self, - self.client2, - self.client1, - object_id1, - memory_buffer=memory_buffer1, - metadata=metadata1) - assert_get_object_equal( - self, - self.client2, - self.client1, - object_id2, - memory_buffer=memory_buffer2, - metadata=metadata2) - - # Check that we can call fetch with duplicated object IDs. - object_id3 = random_object_id() - self.client1.fetch([object_id3, object_id3]) - object_id4, memory_buffer4, metadata4 = create_object( - self.client1, 2000, 2000) - time.sleep(0.1) - # TODO(rkn): Right now we must wait for the object table to be updated. - while not self.client2.contains(object_id4): - self.client2.fetch( - [object_id3, object_id3, object_id4, object_id4]) - assert_get_object_equal( - self, - self.client2, - self.client1, - object_id4, - memory_buffer=memory_buffer4, - metadata=metadata4) - - def test_wait(self): - # Test timeout. - obj_id0 = random_object_id() - self.client1.wait([obj_id0], timeout=100, num_returns=1) - # If we get here, the test worked. - - # Test wait if local objects available. 
- obj_id1 = random_object_id() - self.client1.create(obj_id1, 1000) - self.client1.seal(obj_id1) - ready, waiting = self.client1.wait( - [obj_id1], timeout=100, num_returns=1) - self.assertEqual(set(ready), {obj_id1}) - self.assertEqual(waiting, []) - - # Test wait if only one object available and only one object waited - # for. - obj_id2 = random_object_id() - self.client1.create(obj_id2, 1000) - # Don't seal. - ready, waiting = self.client1.wait( - [obj_id2, obj_id1], timeout=100, num_returns=1) - self.assertEqual(set(ready), {obj_id1}) - self.assertEqual(set(waiting), {obj_id2}) - - # Test wait if object is sealed later. - obj_id3 = random_object_id() - - def finish(): - self.client2.create(obj_id3, 1000) - self.client2.seal(obj_id3) - - t = threading.Timer(0.1, finish) - t.start() - ready, waiting = self.client1.wait( - [obj_id3, obj_id2, obj_id1], timeout=1000, num_returns=2) - self.assertEqual(set(ready), {obj_id1, obj_id3}) - self.assertEqual(set(waiting), {obj_id2}) - - # Test if the appropriate number of objects is shown if some objects - # are not ready. - ready, waiting = self.client1.wait([obj_id3, obj_id2, obj_id1], 100, 3) - self.assertEqual(set(ready), {obj_id1, obj_id3}) - self.assertEqual(set(waiting), {obj_id2}) - - # Don't forget to seal obj_id2. - self.client1.seal(obj_id2) - - # Test calling wait a bunch of times. - object_ids = [] - # TODO(rkn): Increasing n to 100 (or larger) will cause failures. The - # problem appears to be that the number of timers added to the manager - # event loop slow down the manager so much that some of the - # asynchronous Redis commands timeout triggering fatal failure - # callbacks. - n = 40 - for i in range(n * (n + 1) // 2): - if i % 2 == 0: - object_id, _, _ = create_object(self.client1, 200, 200) - else: - object_id, _, _ = create_object(self.client2, 200, 200) - object_ids.append(object_id) - # Try waiting for all of the object IDs on the first client. - waiting = object_ids - retrieved = [] - for i in range(1, n + 1): - ready, waiting = self.client1.wait( - waiting, timeout=1000, num_returns=i) - self.assertEqual(len(ready), i) - retrieved += ready - self.assertEqual(set(retrieved), set(object_ids)) - ready, waiting = self.client1.wait( - object_ids, timeout=1000, num_returns=len(object_ids)) - self.assertEqual(set(ready), set(object_ids)) - self.assertEqual(waiting, []) - # Try waiting for all of the object IDs on the second client. - waiting = object_ids - retrieved = [] - for i in range(1, n + 1): - ready, waiting = self.client2.wait( - waiting, timeout=1000, num_returns=i) - self.assertEqual(len(ready), i) - retrieved += ready - self.assertEqual(set(retrieved), set(object_ids)) - ready, waiting = self.client2.wait( - object_ids, timeout=1000, num_returns=len(object_ids)) - self.assertEqual(set(ready), set(object_ids)) - self.assertEqual(waiting, []) - - # Make sure that wait returns when the requested number of object IDs - # are available and does not wait for all object IDs to be available. 
- object_ids = [random_object_id() for _ in range(9)] + \ - [plasma.ObjectID(ray_constants.ID_SIZE * b'\x00')] - object_ids_perm = object_ids[:] - random.shuffle(object_ids_perm) - for i in range(10): - if i % 2 == 0: - create_object_with_id(self.client1, object_ids_perm[i], 2000, - 2000) - else: - create_object_with_id(self.client2, object_ids_perm[i], 2000, - 2000) - ready, waiting = self.client1.wait(object_ids, num_returns=(i + 1)) - self.assertEqual(set(ready), set(object_ids_perm[:(i + 1)])) - self.assertEqual(set(waiting), set(object_ids_perm[(i + 1):])) - - def test_transfer(self): - num_attempts = 100 - for _ in range(100): - # Create an object. - object_id1, memory_buffer1, metadata1 = create_object( - self.client1, 2000, 2000) - # Transfer the buffer to the the other Plasma store. There is a - # race condition on the create and transfer of the object, so keep - # trying until the object appears on the second Plasma store. - for i in range(num_attempts): - self.client1.transfer("127.0.0.1", self.port2, object_id1) - buff = self.client2.get_buffers( - [object_id1], timeout_ms=100)[0] - if buff is not None: - break - self.assertNotEqual(buff, None) - del buff - - # Compare the two buffers. - assert_get_object_equal( - self, - self.client1, - self.client2, - object_id1, - memory_buffer=memory_buffer1, - metadata=metadata1) - # # Transfer the buffer again. - # self.client1.transfer("127.0.0.1", self.port2, object_id1) - # # Compare the two buffers. - # assert_get_object_equal(self, self.client1, self.client2, - # object_id1, - # memory_buffer=memory_buffer1, - # metadata=metadata1) - - # Create an object. - object_id2, memory_buffer2, metadata2 = create_object( - self.client2, 20000, 20000) - # Transfer the buffer to the the other Plasma store. There is a - # race condition on the create and transfer of the object, so keep - # trying until the object appears on the second Plasma store. - for i in range(num_attempts): - self.client2.transfer("127.0.0.1", self.port1, object_id2) - buff = self.client1.get_buffers( - [object_id2], timeout_ms=100)[0] - if buff is not None: - break - self.assertNotEqual(buff, None) - del buff - - # Compare the two buffers. - assert_get_object_equal( - self, - self.client1, - self.client2, - object_id2, - memory_buffer=memory_buffer2, - metadata=metadata2) - - def test_illegal_functionality(self): - # Create an object id string. - # object_id = random_object_id() - # Create a new buffer. - # memory_buffer = self.client1.create(object_id, 20000) - # This test is commented out because it currently fails. - # # Transferring the buffer before sealing it should fail. - # self.assertRaises(Exception, - # lambda : self.manager1.transfer(1, object_id)) - pass - - def test_stresstest(self): - a = time.time() - object_ids = [] - for i in range(10000): # TODO(pcm): increase this to 100000. - object_id = random_object_id() - object_ids.append(object_id) - self.client1.create(object_id, 1) - self.client1.seal(object_id) - for object_id in object_ids: - self.client1.transfer("127.0.0.1", self.port2, object_id) - b = time.time() - a - - print("it took", b, "seconds to put and transfer the objects") - - -class TestPlasmaManagerRecovery(unittest.TestCase): - def setUp(self): - # Start a Plasma store. - self.store_name, self.p2 = start_plasma_store( - use_valgrind=USE_VALGRIND) - # Start a Redis server. - self.redis_address, _ = services.start_redis("127.0.0.1") - # Start a PlasmaManagers. 
- manager_name, self.p3, self.port1 = ray.plasma.start_plasma_manager( - self.store_name, self.redis_address, use_valgrind=USE_VALGRIND) - # Connect a PlasmaClient. - self.client = plasma.connect(self.store_name, manager_name, 64) - - # Store the processes that will be explicitly killed during tearDown so - # that a test case can remove ones that will be killed during the test. - # NOTE: The plasma managers must be killed before the plasma store - # since plasma store death will bring down the managers. - self.processes_to_kill = [self.p3, self.p2] - - def tearDown(self): - # Check that the processes are still alive. - for process in self.processes_to_kill: - self.assertEqual(process.poll(), None) - - # Kill the Plasma store and Plasma manager processes. - if USE_VALGRIND: - # Give processes opportunity to finish work. - time.sleep(1) - for process in self.processes_to_kill: - process.send_signal(signal.SIGTERM) - process.wait() - if process.returncode != 0: - print("aborting due to valgrind error") - os._exit(-1) - else: - for process in self.processes_to_kill: - process.kill() - - # Clean up the Redis server. - services.cleanup() - - def test_delayed_start(self): - num_objects = 10 - # Create some objects using one client. - object_ids = [random_object_id() for _ in range(num_objects)] - for i in range(10): - create_object_with_id(self.client, object_ids[i], 2000, 2000) - - # Wait until the objects have been sealed in the store. - ready, waiting = self.client.wait(object_ids, num_returns=num_objects) - self.assertEqual(set(ready), set(object_ids)) - self.assertEqual(waiting, []) - - # Start a second plasma manager attached to the same store. - manager_name, self.p5, self.port2 = ray.plasma.start_plasma_manager( - self.store_name, self.redis_address, use_valgrind=USE_VALGRIND) - self.processes_to_kill = [self.p5] + self.processes_to_kill - - # Check that the second manager knows about existing objects. - client2 = plasma.connect(self.store_name, manager_name, 64) - ready, waiting = [], object_ids - while True: - ready, waiting = client2.wait( - object_ids, num_returns=num_objects, timeout=0) - if len(ready) == len(object_ids): - break - - self.assertEqual(set(ready), set(object_ids)) - self.assertEqual(waiting, []) - - -if __name__ == "__main__": - if len(sys.argv) > 1: - # Pop the argument so we don't mess with unittest's own argument - # parser. 
- if sys.argv[-1] == "valgrind": - arg = sys.argv.pop() - USE_VALGRIND = True - print("Using valgrind for tests") - unittest.main(verbosity=2) diff --git a/python/ray/plasma/utils.py b/python/ray/plasma/utils.py deleted file mode 100644 index 45feb0b1db582..0000000000000 --- a/python/ray/plasma/utils.py +++ /dev/null @@ -1,53 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import numpy as np -import random - -import pyarrow.plasma as plasma -import ray.ray_constants as ray_constants - - -def random_object_id(): - return plasma.ObjectID(np.random.bytes(ray_constants.ID_SIZE)) - - -def generate_metadata(length): - metadata_buffer = bytearray(length) - if length > 0: - metadata_buffer[0] = random.randint(0, 255) - metadata_buffer[-1] = random.randint(0, 255) - for _ in range(100): - metadata_buffer[random.randint(0, length - 1)] = (random.randint( - 0, 255)) - return metadata_buffer - - -def write_to_data_buffer(buff, length): - array = np.frombuffer(buff, dtype="uint8") - if length > 0: - array[0] = random.randint(0, 255) - array[-1] = random.randint(0, 255) - for _ in range(100): - array[random.randint(0, length - 1)] = random.randint(0, 255) - - -def create_object_with_id(client, - object_id, - data_size, - metadata_size, - seal=True): - metadata = generate_metadata(metadata_size) - memory_buffer = client.create(object_id, data_size, metadata) - write_to_data_buffer(memory_buffer, data_size) - if seal: - client.seal(object_id) - return memory_buffer, metadata - - -def create_object(client, data_size, metadata_size, seal=True): - object_id = random_object_id() - memory_buffer, metadata = create_object_with_id( - client, object_id, data_size, metadata_size, seal=seal) - return object_id, memory_buffer, metadata diff --git a/python/ray/profiling.py b/python/ray/profiling.py index e4c2d438fc2aa..8cdd8296ed611 100644 --- a/python/ray/profiling.py +++ b/python/ray/profiling.py @@ -59,17 +59,7 @@ def profile(event_type, extra_data=None, worker=None): """ if worker is None: worker = ray.worker.global_worker - if not worker.use_raylet: - # Log the event if this is a worker and not a driver, since the - # driver's event log never gets flushed. 
- if worker.mode == ray.WORKER_MODE: - return RayLogSpanNonRaylet( - worker.profiler, event_type, contents=extra_data) - else: - return NULL_LOG_SPAN - else: - return RayLogSpanRaylet( - worker.profiler, event_type, extra_data=extra_data) + return RayLogSpanRaylet(worker.profiler, event_type, extra_data=extra_data) class Profiler(object): @@ -124,85 +114,31 @@ def flush_profile_data(self): events = self.events self.events = [] - if not self.worker.use_raylet: - event_log_key = b"event_log:" + self.worker.worker_id - event_log_value = json.dumps(events) - self.worker.local_scheduler_client.log_event( - event_log_key, event_log_value, time.time()) + if self.worker.mode == ray.WORKER_MODE: + component_type = "worker" else: - if self.worker.mode == ray.WORKER_MODE: - component_type = "worker" - else: - component_type = "driver" + component_type = "driver" - self.worker.local_scheduler_client.push_profile_events( - component_type, ray.ObjectID(self.worker.worker_id), - self.worker.node_ip_address, events) + self.worker.local_scheduler_client.push_profile_events( + component_type, ray.ObjectID(self.worker.worker_id), + self.worker.node_ip_address, events) def add_event(self, event): with self.lock: self.events.append(event) -class RayLogSpanNonRaylet(object): - """An object used to enable logging a span of events with a with statement. - - Attributes: - event_type (str): The type of the event being logged. - contents: Additional information to log. - """ - - def __init__(self, profiler, event_type, contents=None): - """Initialize a RayLogSpanNonRaylet object.""" - self.profiler = profiler - self.event_type = event_type - self.contents = contents - - def _log(self, event_type, kind, contents=None): - """Log an event to the global state store. - - This adds the event to a buffer of events locally. The buffer can be - flushed and written to the global state store by calling - flush_profile_data(). +class NoopProfiler(object): + """A no-op profile used when collect_profile_data=False.""" - Args: - event_type (str): The type of the event. - contents: More general data to store with the event. - kind (int): Either LOG_POINT, LOG_SPAN_START, or LOG_SPAN_END. This - is LOG_POINT if the event being logged happens at a single - point in time. It is LOG_SPAN_START if we are starting to log a - span of time, and it is LOG_SPAN_END if we are finishing - logging a span of time. - """ - # TODO(rkn): This code currently takes around half a microsecond. Since - # we call it tens of times per task, this adds up. We will need to redo - # the logging code, perhaps in C. - contents = {} if contents is None else contents - assert isinstance(contents, dict) - # Make sure all of the keys and values in the dictionary are strings. - contents = {str(k): str(v) for k, v in contents.items()} - self.profiler.add_event((time.time(), event_type, kind, contents)) + def start_flush_thread(self): + pass - def __enter__(self): - """Log the beginning of a span event.""" - self._log( - event_type=self.event_type, - contents=self.contents, - kind=LOG_SPAN_START) + def flush_profile_data(self): + pass - def __exit__(self, type, value, tb): - """Log the end of a span event. 
Log any exception that occurred.""" - if type is None: - self._log(event_type=self.event_type, kind=LOG_SPAN_END) - else: - self._log( - event_type=self.event_type, - contents={ - "type": str(type), - "value": value, - "traceback": traceback.format_exc() - }, - kind=LOG_SPAN_END) + def add_event(self, event): + pass class RayLogSpanRaylet(object): @@ -230,8 +166,9 @@ def set_attribute(self, key, value): value: The attribute value. """ if not isinstance(key, str) or not isinstance(value, str): - raise ValueError("The extra_data argument must be a " - "dictionary mapping strings to strings.") + raise ValueError("The arguments 'key' and 'value' must both be " + "strings. Instead they are {} and {}.".format( + key, value)) self.extra_data[key] = value def __enter__(self): @@ -250,7 +187,8 @@ def __exit__(self, type, value, tb): for key, value in self.extra_data.items(): if not isinstance(key, str) or not isinstance(value, str): raise ValueError("The extra_data argument must be a " - "dictionary mapping strings to strings.") + "dictionary mapping strings to strings. " + "Instead it is {}.".format(self.extra_data)) if type is not None: extra_data = json.dumps({ diff --git a/python/ray/ray_constants.py b/python/ray/ray_constants.py index a9e4519d4cf5d..a1d5e1a765438 100644 --- a/python/ray/ray_constants.py +++ b/python/ray/ray_constants.py @@ -5,7 +5,7 @@ import os -import ray +from ray.raylet import ObjectID def env_integer(key, default): @@ -15,7 +15,7 @@ def env_integer(key, default): ID_SIZE = 20 -NIL_JOB_ID = ray.ObjectID(ID_SIZE * b"\xff") +NIL_JOB_ID = ObjectID(ID_SIZE * b"\xff") # If a remote function or actor (or some other export) has serialized size # greater than this quantity, print an warning. @@ -41,7 +41,6 @@ def env_integer(key, default): WORKER_CRASH_PUSH_ERROR = "worker_crash" WORKER_DIED_PUSH_ERROR = "worker_died" PUT_RECONSTRUCTION_PUSH_ERROR = "put_reconstruction" -HASH_MISMATCH_PUSH_ERROR = "object_hash_mismatch" INFEASIBLE_TASK_ERROR = "infeasible_task" REMOVED_NODE_ERROR = "node_removed" MONITOR_DIED_ERROR = "monitor_died" diff --git a/python/ray/local_scheduler/__init__.py b/python/ray/raylet/__init__.py similarity index 76% rename from python/ray/local_scheduler/__init__.py rename to python/ray/raylet/__init__.py index a469776f133b6..8757f59741567 100644 --- a/python/ray/local_scheduler/__init__.py +++ b/python/ray/raylet/__init__.py @@ -2,10 +2,9 @@ from __future__ import division from __future__ import print_function -from ray.core.src.local_scheduler.liblocal_scheduler_library_python import ( +from ray.core.src.ray.raylet.liblocal_scheduler_library_python import ( Task, LocalSchedulerClient, ObjectID, check_simple_value, compute_task_id, task_from_string, task_to_string, _config, common_error) -from .local_scheduler_services import start_local_scheduler __all__ = [ "Task", "LocalSchedulerClient", "ObjectID", "check_simple_value", diff --git a/python/ray/remote_function.py b/python/ray/remote_function.py index 287d3d045539f..fb2a29e45c512 100644 --- a/python/ray/remote_function.py +++ b/python/ray/remote_function.py @@ -5,6 +5,7 @@ import copy import hashlib import inspect +import logging import ray.ray_constants as ray_constants import ray.signature @@ -14,6 +15,8 @@ DEFAULT_REMOTE_FUNCTION_NUM_RETURN_VALS = 1 DEFAULT_REMOTE_FUNCTION_MAX_CALLS = 0 +logger = logging.getLogger(__name__) + def compute_function_id(function): """Compute an function ID for a function. @@ -22,7 +25,7 @@ def compute_function_id(function): func: The actual function. 
Returns: - This returns the function ID. + Raw bytes of the function id """ function_id_hash = hashlib.sha1() # Include the function module and name in the hash. @@ -39,8 +42,6 @@ def compute_function_id(function): # Compute the function ID. function_id = function_id_hash.digest() assert len(function_id) == ray_constants.ID_SIZE - function_id = ray.ObjectID(function_id) - return function_id @@ -72,7 +73,7 @@ def __init__(self, function, num_cpus, num_gpus, resources, # TODO(rkn): We store the function ID as a string, so that # RemoteFunction objects can be pickled. We should undo this when # we allow ObjectIDs to be pickled. - self._function_id = compute_function_id(self._function).id() + self._function_id = compute_function_id(function) self._function_name = ( self._function.__module__ + '.' + self._function.__name__) self._num_cpus = (DEFAULT_REMOTE_FUNCTION_CPUS @@ -90,11 +91,7 @@ def __init__(self, function, num_cpus, num_gpus, resources, # # Export the function. worker = ray.worker.get_global_worker() - if worker.mode == ray.worker.SCRIPT_MODE: - self._export() - elif worker.mode is None: - worker.cached_remote_functions_and_actors.append( - ("remote_function", self)) + worker.function_actor_manager.export(self) def __call__(self, *args, **kwargs): raise Exception("Remote functions cannot be called directly. Instead " @@ -103,7 +100,7 @@ def __call__(self, *args, **kwargs): def remote(self, *args, **kwargs): """This runs immediately when a remote function is called.""" - return self._submit(args=args, kwargs=kwargs) + return self._remote(args=args, kwargs=kwargs) def _submit(self, args=None, @@ -112,6 +109,23 @@ def _submit(self, num_cpus=None, num_gpus=None, resources=None): + logger.warn( + "WARNING: _submit() is being deprecated. Please use _remote().") + return self._remote( + args=args, + kwargs=kwargs, + num_return_vals=num_return_vals, + num_cpus=num_cpus, + num_gpus=num_gpus, + resources=resources) + + def _remote(self, + args=None, + kwargs=None, + num_return_vals=None, + num_cpus=None, + num_gpus=None, + resources=None): """An experimental alternate way to submit remote functions.""" worker = ray.worker.get_global_worker() worker.check_connected() @@ -141,9 +155,3 @@ def _submit(self, return object_ids[0] elif len(object_ids) > 1: return object_ids - - def _export(self): - worker = ray.worker.get_global_worker() - worker.export_remote_function( - ray.ObjectID(self._function_id), self._function_name, - self._function, self._max_calls, self) diff --git a/python/ray/rllib/__init__.py b/python/ray/rllib/__init__.py index db9f52687126c..fd6ba3407eaec 100644 --- a/python/ray/rllib/__init__.py +++ b/python/ray/rllib/__init__.py @@ -2,6 +2,8 @@ from __future__ import division from __future__ import print_function +import logging + # Note: do not introduce unnecessary library dependencies here, e.g. gym. # This file is imported from the tune module in order to register RLlib agents. 
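In the remote_function.py hunk above, the old _submit entry point is kept only as a shim that logs a deprecation warning and forwards to _remote. A minimal migration sketch, assuming a hypothetical remote function f and a running Ray instance:

import ray

ray.init()

@ray.remote
def f(x):
    return x + 1

# Old spelling: still accepted, but now logs "_submit() is being deprecated".
oid = f._submit(args=[1], num_return_vals=1)
# New spelling, same keyword arguments:
oid = f._remote(args=[1], num_return_vals=1)
print(ray.get(oid))
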
from ray.tune.registry import register_trainable @@ -11,15 +13,26 @@ from ray.rllib.env.async_vector_env import AsyncVectorEnv from ray.rllib.env.multi_agent_env import MultiAgentEnv from ray.rllib.env.vector_env import VectorEnv -from ray.rllib.env.serving_env import ServingEnv +from ray.rllib.env.external_env import ExternalEnv from ray.rllib.evaluation.policy_evaluator import PolicyEvaluator from ray.rllib.evaluation.sample_batch import SampleBatch +def _setup_logger(): + logger = logging.getLogger("ray.rllib") + handler = logging.StreamHandler() + handler.setFormatter( + logging.Formatter( + "%(asctime)s\t%(levelname)s %(filename)s:%(lineno)s -- %(message)s" + )) + logger.addHandler(handler) + logger.propagate = False + + def _register_all(): for key in [ - "PPO", "ES", "DQN", "APEX", "A3C", "BC", "PG", "DDPG", "APEX_DDPG", + "PPO", "ES", "DQN", "APEX", "A3C", "PG", "DDPG", "APEX_DDPG", "IMPALA", "ARS", "A2C", "__fake", "__sigmoid_fake_data", "__parameter_tuning" ]: @@ -27,6 +40,7 @@ def _register_all(): register_trainable(key, get_agent_class(key)) +_setup_logger() _register_all() __all__ = [ @@ -37,5 +51,5 @@ def _register_all(): "AsyncVectorEnv", "MultiAgentEnv", "VectorEnv", - "ServingEnv", + "ExternalEnv", ] diff --git a/python/ray/rllib/agents/a3c/a2c.py b/python/ray/rllib/agents/a3c/a2c.py index a792d1d160831..c344592b90863 100644 --- a/python/ray/rllib/agents/a3c/a2c.py +++ b/python/ray/rllib/agents/a3c/a2c.py @@ -4,13 +4,12 @@ from ray.rllib.agents.a3c.a3c import A3CAgent, DEFAULT_CONFIG as A3C_CONFIG from ray.rllib.optimizers import SyncSamplesOptimizer +from ray.rllib.utils.annotations import override from ray.rllib.utils import merge_dicts -from ray.tune.trial import Resources A2C_DEFAULT_CONFIG = merge_dicts( A3C_CONFIG, { - "gpu": False, "sample_batch_size": 20, "min_iter_time_s": 10, "sample_async": False, @@ -24,16 +23,8 @@ class A2CAgent(A3CAgent): _agent_name = "A2C" _default_config = A2C_DEFAULT_CONFIG + @override(A3CAgent) def _make_optimizer(self): return SyncSamplesOptimizer(self.local_evaluator, self.remote_evaluators, self.config["optimizer"]) - - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - return Resources( - cpu=1, - gpu=cf["gpu_fraction"] if cf["gpu"] else 0, - extra_cpu=cf["num_workers"], - extra_gpu=cf["use_gpu_for_workers"] and cf["num_workers"] or 0) diff --git a/python/ray/rllib/agents/a3c/a3c.py b/python/ray/rllib/agents/a3c/a3c.py index afda9506248d3..43daa0b3ef781 100644 --- a/python/ray/rllib/agents/a3c/a3c.py +++ b/python/ray/rllib/agents/a3c/a3c.py @@ -7,9 +7,10 @@ from ray.rllib.agents.a3c.a3c_tf_policy_graph import A3CPolicyGraph from ray.rllib.agents.agent import Agent, with_common_config from ray.rllib.optimizers import AsyncGradientsOptimizer -from ray.rllib.utils import merge_dicts -from ray.tune.trial import Resources +from ray.rllib.utils.annotations import override +# yapf: disable +# __sphinx_doc_begin__ DEFAULT_CONFIG = with_common_config({ # Size of rollout batch "sample_batch_size": 10, @@ -27,37 +28,14 @@ "vf_loss_coeff": 0.5, # Entropy coefficient "entropy_coeff": -0.01, - # Whether to place workers on GPUs - "use_gpu_for_workers": False, # Min time per iteration "min_iter_time_s": 5, # Workers sample async. Note that this increases the effective # sample_batch_size by up to 5x due to async buffering of batches. "sample_async": True, - # Model and preprocessor options - "model": { - # Use LSTM model. Requires TF. - "use_lstm": False, - # Max seq length for LSTM training. 
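The @override(...) decorator pulled in from ray.rllib.utils.annotations in the agent hunks above asserts that the decorated method really overrides a method of the named parent class. A rough sketch of that idea only, assuming the actual implementation may differ in its details:

def override(cls):
    """Annotation for methods that override a method of `cls`."""

    def check_override(method):
        # Fail loudly at class-definition time if `cls` has no such method.
        if method.__name__ not in dir(cls):
            raise NameError("{} does not override any method of {}".format(
                method.__name__, cls.__name__))
        return method

    return check_override
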
- "max_seq_len": 20, - # (Image statespace) - Converts image to Channels = 1 - "grayscale": True, - # (Image statespace) - Each pixel - "zero_mean": False, - # (Image statespace) - Converts image to (dim, dim, C) - "dim": 84, - # (Image statespace) - Converts image shape to (C, dim, dim) - "channel_major": False, - }, - # Configure TF for single-process operation - "tf_session_args": { - "intra_op_parallelism_threads": 1, - "inter_op_parallelism_threads": 1, - "gpu_options": { - "allow_growth": True, - }, - }, }) +# __sphinx_doc_end__ +# yapf: enable class A3CAgent(Agent): @@ -67,15 +45,7 @@ class A3CAgent(Agent): _default_config = DEFAULT_CONFIG _policy_graph = A3CPolicyGraph - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - return Resources( - cpu=1, - gpu=0, - extra_cpu=cf["num_workers"], - extra_gpu=cf["use_gpu_for_workers"] and cf["num_workers"] or 0) - + @override(Agent) def _init(self): if self.config["use_pytorch"]: from ray.rllib.agents.a3c.a3c_torch_policy_graph import \ @@ -87,21 +57,22 @@ def _init(self): self.local_evaluator = self.make_local_evaluator( self.env_creator, policy_cls) self.remote_evaluators = self.make_remote_evaluators( - self.env_creator, policy_cls, self.config["num_workers"], - {"num_gpus": 1 if self.config["use_gpu_for_workers"] else 0}) + self.env_creator, policy_cls, self.config["num_workers"]) self.optimizer = self._make_optimizer() - def _make_optimizer(self): - return AsyncGradientsOptimizer(self.local_evaluator, - self.remote_evaluators, - self.config["optimizer"]) - + @override(Agent) def _train(self): prev_steps = self.optimizer.num_steps_sampled start = time.time() while time.time() - start < self.config["min_iter_time_s"]: self.optimizer.step() - result = self.optimizer.collect_metrics() + result = self.optimizer.collect_metrics( + self.config["collect_metrics_timeout"]) result.update(timesteps_this_iter=self.optimizer.num_steps_sampled - prev_steps) return result + + def _make_optimizer(self): + return AsyncGradientsOptimizer(self.local_evaluator, + self.remote_evaluators, + self.config["optimizer"]) diff --git a/python/ray/rllib/agents/a3c/a3c_tf_policy_graph.py b/python/ray/rllib/agents/a3c/a3c_tf_policy_graph.py index b2298acc9edb6..50258f58ac3aa 100644 --- a/python/ray/rllib/agents/a3c/a3c_tf_policy_graph.py +++ b/python/ray/rllib/agents/a3c/a3c_tf_policy_graph.py @@ -10,11 +10,12 @@ import ray from ray.rllib.utils.error import UnsupportedSpaceException from ray.rllib.utils.explained_variance import explained_variance +from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.postprocessing import compute_advantages from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph, \ LearningRateSchedule -from ray.rllib.models.misc import linear, normc_initializer from ray.rllib.models.catalog import ModelCatalog +from ray.rllib.utils.annotations import override class A3CLoss(object): @@ -49,12 +50,16 @@ def __init__(self, observation_space, action_space, config): tf.float32, [None] + list(observation_space.shape)) dist_class, logit_dim = ModelCatalog.get_action_dist( action_space, self.config["model"]) - self.model = ModelCatalog.get_model(self.observations, logit_dim, - self.config["model"]) + prev_actions = ModelCatalog.get_action_placeholder(action_space) + prev_rewards = tf.placeholder(tf.float32, [None], name="prev_reward") + self.model = ModelCatalog.get_model({ + "obs": self.observations, + "prev_actions": prev_actions, + "prev_rewards": prev_rewards, + 
"is_training": self._get_is_training_placeholder(), + }, observation_space, logit_dim, self.config["model"]) action_dist = dist_class(self.model.outputs) - self.vf = tf.reshape( - linear(self.model.last_layer, 1, "value", normc_initializer(1.0)), - [-1]) + self.vf = self.model.value_function() self.var_list = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES, tf.get_variable_scope().name) @@ -78,6 +83,8 @@ def __init__(self, observation_space, action_space, config): loss_in = [ ("obs", self.observations), ("actions", actions), + ("prev_actions", prev_actions), + ("prev_rewards", prev_rewards), ("advantages", advantages), ("value_targets", self.v_target), ] @@ -90,10 +97,12 @@ def __init__(self, observation_space, action_space, config): self.sess, obs_input=self.observations, action_sampler=action_dist.sample(), - loss=self.loss.total_loss, + loss=self.model.loss() + self.loss.total_loss, loss_inputs=loss_in, state_inputs=self.model.state_in, state_outputs=self.model.state_out, + prev_action_input=prev_actions, + prev_reward_input=prev_rewards, seq_lens=self.model.seq_lens, max_seq_len=self.config["model"]["max_seq_len"]) @@ -111,31 +120,15 @@ def __init__(self, observation_space, action_space, config): self.sess.run(tf.global_variables_initializer()) - def extra_compute_action_fetches(self): - return {"vf_preds": self.vf} - - def value(self, ob, *args): - feed_dict = {self.observations: [ob], self.model.seq_lens: [1]} - assert len(args) == len(self.model.state_in), \ - (args, self.model.state_in) - for k, v in zip(self.model.state_in, args): - feed_dict[k] = v - vf = self.sess.run(self.vf, feed_dict) - return vf[0] - - def gradients(self, optimizer): - grads = tf.gradients(self.loss.total_loss, self.var_list) - self.grads, _ = tf.clip_by_global_norm(grads, self.config["grad_clip"]) - clipped_grads = list(zip(self.grads, self.var_list)) - return clipped_grads - - def extra_compute_grad_fetches(self): - return self.stats_fetches - + @override(PolicyGraph) def get_initial_state(self): return self.model.state_init - def postprocess_trajectory(self, sample_batch, other_agent_batches=None): + @override(PolicyGraph) + def postprocess_trajectory(self, + sample_batch, + other_agent_batches=None, + episode=None): completed = sample_batch["dones"][-1] if completed: last_r = 0.0 @@ -143,6 +136,30 @@ def postprocess_trajectory(self, sample_batch, other_agent_batches=None): next_state = [] for i in range(len(self.model.state_in)): next_state.append([sample_batch["state_out_{}".format(i)][-1]]) - last_r = self.value(sample_batch["new_obs"][-1], *next_state) + last_r = self._value(sample_batch["new_obs"][-1], *next_state) return compute_advantages(sample_batch, last_r, self.config["gamma"], self.config["lambda"]) + + @override(TFPolicyGraph) + def gradients(self, optimizer): + grads = tf.gradients(self.loss.total_loss, self.var_list) + self.grads, _ = tf.clip_by_global_norm(grads, self.config["grad_clip"]) + clipped_grads = list(zip(self.grads, self.var_list)) + return clipped_grads + + @override(TFPolicyGraph) + def extra_compute_grad_fetches(self): + return self.stats_fetches + + @override(TFPolicyGraph) + def extra_compute_action_fetches(self): + return {"vf_preds": self.vf} + + def _value(self, ob, *args): + feed_dict = {self.observations: [ob], self.model.seq_lens: [1]} + assert len(args) == len(self.model.state_in), \ + (args, self.model.state_in) + for k, v in zip(self.model.state_in, args): + feed_dict[k] = v + vf = self.sess.run(self.vf, feed_dict) + return vf[0] diff --git 
a/python/ray/rllib/agents/a3c/a3c_torch_policy_graph.py b/python/ray/rllib/agents/a3c/a3c_torch_policy_graph.py index dcdada591a053..c24340d8d10a0 100644 --- a/python/ray/rllib/agents/a3c/a3c_torch_policy_graph.py +++ b/python/ray/rllib/agents/a3c/a3c_torch_policy_graph.py @@ -10,7 +10,9 @@ from ray.rllib.models.pytorch.misc import var_to_np from ray.rllib.models.catalog import ModelCatalog from ray.rllib.evaluation.postprocessing import compute_advantages +from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.torch_policy_graph import TorchPolicyGraph +from ray.rllib.utils.annotations import override class A3CLoss(nn.Module): @@ -56,13 +58,19 @@ def __init__(self, obs_space, action_space, config): loss, loss_inputs=["obs", "actions", "advantages", "value_targets"]) + @override(TorchPolicyGraph) def extra_action_out(self, model_out): return {"vf_preds": var_to_np(model_out[1])} + @override(TorchPolicyGraph) def optimizer(self): return torch.optim.Adam(self.model.parameters(), lr=self.config["lr"]) - def postprocess_trajectory(self, sample_batch, other_agent_batches=None): + @override(PolicyGraph) + def postprocess_trajectory(self, + sample_batch, + other_agent_batches=None, + episode=None): completed = sample_batch["dones"][-1] if completed: last_r = 0.0 diff --git a/python/ray/rllib/agents/agent.py b/python/ray/rllib/agents/agent.py index 030ae64248d87..8e6797eede032 100644 --- a/python/ray/rllib/agents/agent.py +++ b/python/ray/rllib/agents/agent.py @@ -2,32 +2,92 @@ from __future__ import division from __future__ import print_function +from datetime import datetime import copy -import json +import logging import os import pickle +import six import tempfile -from datetime import datetime import tensorflow as tf import ray +from ray.rllib.models import MODEL_DEFAULTS from ray.rllib.evaluation.policy_evaluator import PolicyEvaluator from ray.rllib.optimizers.policy_optimizer import PolicyOptimizer +from ray.rllib.utils.annotations import override from ray.rllib.utils import FilterManager, deep_update, merge_dicts -from ray.tune.registry import ENV_CREATOR, _global_registry +from ray.tune.registry import ENV_CREATOR, register_env, _global_registry from ray.tune.trainable import Trainable +from ray.tune.trial import Resources from ray.tune.logger import UnifiedLogger from ray.tune.result import DEFAULT_RESULTS_DIR +logger = logging.getLogger(__name__) + +# yapf: disable +# __sphinx_doc_begin__ COMMON_CONFIG = { + # === Debugging === + # Whether to write episode stats and videos to the agent log dir + "monitor": False, + # Set the ray.rllib.* log level for the agent process and its evaluators + "log_level": "INFO", + # Callbacks that will be run during various phases of training. These all + # take a single "info" dict as an argument. For episode callbacks, custom + # metrics can be attached to the episode by updating the episode object's + # custom metrics dict (see examples/custom_metrics_and_callbacks.py). + "callbacks": { + "on_episode_start": None, # arg: {"env": .., "episode": ...} + "on_episode_step": None, # arg: {"env": .., "episode": ...} + "on_episode_end": None, # arg: {"env": .., "episode": ...} + "on_sample_end": None, # arg: {"samples": .., "evaluator": ...} + "on_train_result": None, # arg: {"agent": ..., "result": ...} + }, + + # === Policy === + # Arguments to pass to model. See models/catalog.py for a full list of the + # available model options. + "model": MODEL_DEFAULTS, + # Arguments to pass to the policy optimizer. These vary by optimizer. 
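Each hook in the new "callbacks" block above receives a single info dict. A small hypothetical example of attaching a custom metric at episode end, assuming the episode object exposes its custom metrics as episode.custom_metrics (the metric name below is made up for illustration):

def on_episode_end(info):
    episode = info["episode"]
    # Record a custom per-episode metric, as described in the config comment.
    episode.custom_metrics["my_metric"] = 1.0

config = {
    "callbacks": {"on_episode_end": on_episode_end},
}
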
+ "optimizer": {}, + + # === Environment === # Discount factor of the MDP "gamma": 0.99, - # Number of steps after which the rollout gets cut + # Number of steps after which the episode is forced to terminate "horizon": None, - # Number of environments to evaluate vectorwise per worker. - "num_envs_per_worker": 1, + # Arguments to pass to the env creator + "env_config": {}, + # Environment name can also be passed via config + "env": None, + # Whether to clip rewards prior to experience postprocessing. Setting to + # None means clip for Atari only. + "clip_rewards": None, + # Whether to np.clip() actions to the action space low/high range spec. + "clip_actions": True, + # Whether to use rllib or deepmind preprocessors by default + "preprocessor_pref": "deepmind", + + # === Resources === # Number of actors used for parallelism "num_workers": 2, + # Number of GPUs to allocate to the driver. Note that not all algorithms + # can take advantage of driver GPUs. This can be fraction (e.g., 0.3 GPUs). + "num_gpus": 0, + # Number of CPUs to allocate per worker. + "num_cpus_per_worker": 1, + # Number of GPUs to allocate per worker. This can be fractional. + "num_gpus_per_worker": 0, + # Any custom resources to allocate per worker. + "custom_resources_per_worker": {}, + # Number of CPUs to allocate for the driver. Note: this only takes effect + # when running in Tune. + "num_cpus_for_driver": 1, + + # === Execution === + # Number of environments to evaluate vectorwise per worker. + "num_envs_per_worker": 1, # Default sample batch size "sample_batch_size": 200, # Training batch size, if applicable. Should be >= sample_batch_size. @@ -37,30 +97,15 @@ "batch_mode": "truncate_episodes", # Whether to use a background thread for sampling (slightly off-policy) "sample_async": False, - # Which observation filter to apply to the observation + # Element-wise observation filter, either "NoFilter" or "MeanStdFilter" "observation_filter": "NoFilter", # Whether to synchronize the statistics of remote filters. "synchronize_filters": True, - # Whether to clip rewards prior to experience postprocessing. Setting to - # None means clip for Atari only. - "clip_rewards": None, - # Whether to use rllib or deepmind preprocessors - "preprocessor_pref": "deepmind", - # Arguments to pass to the env creator - "env_config": {}, - # Environment name can also be passed via config - "env": None, - # Arguments to pass to model - "model": { - "use_lstm": False, - "max_seq_len": 20, - }, - # Arguments to pass to the rllib optimizer - "optimizer": {}, # Configure TF for single-process operation by default "tf_session_args": { - "intra_op_parallelism_threads": 1, - "inter_op_parallelism_threads": 1, + # note: overriden by `local_evaluator_tf_session_args` + "intra_op_parallelism_threads": 2, + "inter_op_parallelism_threads": 2, "gpu_options": { "allow_growth": True, }, @@ -70,12 +115,17 @@ }, "allow_soft_placement": True, # required by PPO multi-gpu }, + # Override the following tf session args on the local evaluator + "local_evaluator_tf_session_args": { + # Allow a higher level of parallelism by default, but not unlimited + # since that can cause crashes with many concurrent drivers. 
+ "intra_op_parallelism_threads": 8, + "inter_op_parallelism_threads": 8, + }, # Whether to LZ4 compress observations "compress_observations": False, - # Whether to write episode stats and videos to the agent log dir - "monitor": False, - # Allocate a fraction of a GPU instead of one (e.g., 0.3 GPUs) - "gpu_fraction": 1, + # Drop metric batches from unresponsive workers after this many seconds + "collect_metrics_timeout": 180, # === Multiagent === "multiagent": { @@ -88,6 +138,8 @@ "policies_to_train": None, }, } +# __sphinx_doc_end__ +# yapf: enable def with_common_config(extra_config): @@ -115,68 +167,6 @@ class Agent(Trainable): "tf_session_args", "env_config", "model", "optimizer", "multiagent" ] - def make_local_evaluator(self, env_creator, policy_graph): - """Convenience method to return configured local evaluator.""" - - return self._make_evaluator( - PolicyEvaluator, - env_creator, - policy_graph, - 0, - # important: allow local tf to use multiple CPUs for optimization - merge_dicts( - self.config, { - "tf_session_args": { - "intra_op_parallelism_threads": None, - "inter_op_parallelism_threads": None, - } - })) - - def make_remote_evaluators(self, env_creator, policy_graph, count, - remote_args): - """Convenience method to return a number of remote evaluators.""" - - cls = PolicyEvaluator.as_remote(**remote_args).remote - return [ - self._make_evaluator(cls, env_creator, policy_graph, i + 1, - self.config) for i in range(count) - ] - - def _make_evaluator(self, cls, env_creator, policy_graph, worker_index, - config): - def session_creator(): - return tf.Session( - config=tf.ConfigProto(**config["tf_session_args"])) - - return cls( - env_creator, - self.config["multiagent"]["policy_graphs"] or policy_graph, - policy_mapping_fn=self.config["multiagent"]["policy_mapping_fn"], - policies_to_train=self.config["multiagent"]["policies_to_train"], - tf_session_creator=(session_creator - if config["tf_session_args"] else None), - batch_steps=config["sample_batch_size"], - batch_mode=config["batch_mode"], - episode_horizon=config["horizon"], - preprocessor_pref=config["preprocessor_pref"], - sample_async=config["sample_async"], - compress_observations=config["compress_observations"], - num_envs=config["num_envs_per_worker"], - observation_filter=config["observation_filter"], - clip_rewards=config["clip_rewards"], - env_config=config["env_config"], - model_config=config["model"], - policy_config=config, - worker_index=worker_index, - monitor_path=self.logdir if config["monitor"] else None) - - @classmethod - def resource_help(cls, config): - return ("\n\nYou can adjust the resource requests of RLlib agents by " - "setting `num_workers` and other configs. See the " - "DEFAULT_CONFIG defined by each agent for more info.\n\n" - "The config of this agent is: " + json.dumps(config)) - def __init__(self, config=None, env=None, logger_creator=None): """Initialize an RLLib agent. @@ -189,17 +179,19 @@ def __init__(self, config=None, env=None, logger_creator=None): """ config = config or {} + Agent._validate_config(config) # Vars to synchronize to evaluators on each train call self.global_vars = {"timestep": 0} # Agents allow env ids to be passed directly to the constructor. 
- self._env_id = env or config.get("env") + self._env_id = _register_if_needed(env or config.get("env")) # Create a default logger creator if no logger_creator is specified if logger_creator is None: timestr = datetime.today().strftime("%Y-%m-%d_%H-%M-%S") - logdir_prefix = '_'.join([self._agent_name, self._env_id, timestr]) + logdir_prefix = "{}_{}_{}".format(self._agent_name, self._env_id, + timestr) def default_logger_creator(config): """Creates a Unified logger with a default logdir prefix @@ -215,6 +207,19 @@ def default_logger_creator(config): Trainable.__init__(self, config, logger_creator) + @classmethod + @override(Trainable) + def default_resource_request(cls, config): + cf = dict(cls._default_config, **config) + Agent._validate_config(cf) + # TODO(ekl): add custom resources here once tune supports them + return Resources( + cpu=cf["num_cpus_for_driver"], + gpu=cf["num_gpus"], + extra_cpu=cf["num_cpus_per_worker"] * cf["num_workers"], + extra_gpu=cf["num_gpus_per_worker"] * cf["num_workers"]) + + @override(Trainable) def train(self): """Overrides super.train to synchronize global vars.""" @@ -224,6 +229,7 @@ def train(self): self.optimizer.local_evaluator.set_global_vars(self.global_vars) for ev in self.optimizer.remote_evaluators: ev.set_global_vars.remote(self.global_vars) + logger.debug("updated global vars: {}".format(self.global_vars)) if (self.config.get("observation_filter", "NoFilter") != "NoFilter" and hasattr(self, "local_evaluator")): @@ -231,13 +237,22 @@ def train(self): self.local_evaluator.filters, self.remote_evaluators, update_remote=self.config["synchronize_filters"]) - - return Trainable.train(self) - - def _setup(self): + logger.debug("synchronized filters: {}".format( + self.local_evaluator.filters)) + + result = Trainable.train(self) + if self.config["callbacks"].get("on_train_result"): + self.config["callbacks"]["on_train_result"]({ + "agent": self, + "result": result, + }) + return result + + @override(Trainable) + def _setup(self, config): env = self._env_id if env: - self.config["env"] = env + config["env"] = env if _global_registry.contains(ENV_CREATOR, env): self.env_creator = _global_registry.get(ENV_CREATOR, env) else: @@ -247,36 +262,41 @@ def _setup(self): self.env_creator = lambda env_config: None # Merge the supplied config with the class default - merged_config = self._default_config.copy() - merged_config = deep_update(merged_config, self.config, + merged_config = copy.deepcopy(self._default_config) + merged_config = deep_update(merged_config, config, self._allow_unknown_configs, self._allow_unknown_subkeys) self.config = merged_config + if self.config.get("log_level"): + logging.getLogger("ray.rllib").setLevel(self.config["log_level"]) # TODO(ekl) setting the graph is unnecessary for PyTorch agents with tf.Graph().as_default(): self._init() - def _init(self): - """Subclasses should override this for custom initialization.""" - - raise NotImplementedError - - @property - def iteration(self): - """Current training iter, auto-incremented with each train() call.""" - - return self._iteration + @override(Trainable) + def _stop(self): + # workaround for https://github.com/ray-project/ray/issues/1516 + if hasattr(self, "remote_evaluators"): + for ev in self.remote_evaluators: + ev.__ray_terminate__.remote() + if hasattr(self, "optimizer"): + self.optimizer.stop() - @property - def _agent_name(self): - """Subclasses should override this to declare their name.""" + @override(Trainable) + def _save(self, checkpoint_dir): + checkpoint_path = 
os.path.join(checkpoint_dir, + "checkpoint-{}".format(self.iteration)) + pickle.dump(self.__getstate__(), open(checkpoint_path, "wb")) + return checkpoint_path - raise NotImplementedError + @override(Trainable) + def _restore(self, checkpoint_path): + extra_data = pickle.load(open(checkpoint_path, "rb")) + self.__setstate__(extra_data) - @property - def _default_config(self): - """Subclasses should override this to declare their default config.""" + def _init(self): + """Subclasses should override this for custom initialization.""" raise NotImplementedError @@ -299,13 +319,29 @@ def compute_action(self, observation, state=None, policy_id="default"): observation, update=False) if state: return self.local_evaluator.for_policy( - lambda p: p.compute_single_action( - filtered_obs, state, is_training=False), + lambda p: p.compute_single_action(filtered_obs, state), policy_id=policy_id) return self.local_evaluator.for_policy( - lambda p: p.compute_single_action( - filtered_obs, state, is_training=False)[0], - policy_id=policy_id) + lambda p: p.compute_single_action(filtered_obs, state)[0], + policy_id=policy_id) + + @property + def iteration(self): + """Current training iter, auto-incremented with each train() call.""" + + return self._iteration + + @property + def _agent_name(self): + """Subclasses should override this to declare their name.""" + + raise NotImplementedError + + @property + def _default_config(self): + """Subclasses should override this to declare their default config.""" + + raise NotImplementedError def get_weights(self, policies=None): """Return a dictionary of policy ids to weights. @@ -324,11 +360,89 @@ def set_weights(self, weights): """ self.local_evaluator.set_weights(weights) - def _stop(self): - # workaround for https://github.com/ray-project/ray/issues/1516 - if hasattr(self, "remote_evaluators"): - for ev in self.remote_evaluators: - ev.__ray_terminate__.remote() + def make_local_evaluator(self, env_creator, policy_graph): + """Convenience method to return configured local evaluator.""" + + return self._make_evaluator( + PolicyEvaluator, + env_creator, + policy_graph, + 0, + # important: allow local tf to use more CPUs for optimization + merge_dicts(self.config, { + "tf_session_args": self. 
+ config["local_evaluator_tf_session_args"] + })) + + def make_remote_evaluators(self, env_creator, policy_graph, count): + """Convenience method to return a number of remote evaluators.""" + + remote_args = { + "num_cpus": self.config["num_cpus_per_worker"], + "num_gpus": self.config["num_gpus_per_worker"], + "resources": self.config["custom_resources_per_worker"], + } + + cls = PolicyEvaluator.as_remote(**remote_args).remote + return [ + self._make_evaluator(cls, env_creator, policy_graph, i + 1, + self.config) for i in range(count) + ] + + def _make_evaluator(self, cls, env_creator, policy_graph, worker_index, + config): + def session_creator(): + logger.debug("Creating TF session {}".format( + config["tf_session_args"])) + return tf.Session( + config=tf.ConfigProto(**config["tf_session_args"])) + + return cls( + env_creator, + self.config["multiagent"]["policy_graphs"] or policy_graph, + policy_mapping_fn=self.config["multiagent"]["policy_mapping_fn"], + policies_to_train=self.config["multiagent"]["policies_to_train"], + tf_session_creator=(session_creator + if config["tf_session_args"] else None), + batch_steps=config["sample_batch_size"], + batch_mode=config["batch_mode"], + episode_horizon=config["horizon"], + preprocessor_pref=config["preprocessor_pref"], + sample_async=config["sample_async"], + compress_observations=config["compress_observations"], + num_envs=config["num_envs_per_worker"], + observation_filter=config["observation_filter"], + clip_rewards=config["clip_rewards"], + clip_actions=config["clip_actions"], + env_config=config["env_config"], + model_config=config["model"], + policy_config=config, + worker_index=worker_index, + monitor_path=self.logdir if config["monitor"] else None, + log_level=config["log_level"], + callbacks=config["callbacks"]) + + @classmethod + def resource_help(cls, config): + return ("\n\nYou can adjust the resource requests of RLlib agents by " + "setting `num_workers` and other configs. 
See the " + "DEFAULT_CONFIG defined by each agent for more info.\n\n" + "The config of this agent is: {}".format(config)) + + @staticmethod + def _validate_config(config): + if "gpu" in config: + raise ValueError( + "The `gpu` config is deprecated, please use `num_gpus=0|1` " + "instead.") + if "gpu_fraction" in config: + raise ValueError( + "The `gpu_fraction` config is deprecated, please use " + "`num_gpus=` instead.") + if "use_gpu_for_workers" in config: + raise ValueError( + "The `use_gpu_for_workers` config is deprecated, please use " + "`num_gpus_per_worker=1` instead.") def __getstate__(self): state = {} @@ -347,16 +461,14 @@ def __setstate__(self, state): if "optimizer" in state: self.optimizer.restore(state["optimizer"]) - def _save(self, checkpoint_dir): - checkpoint_path = os.path.join(checkpoint_dir, - "checkpoint-{}".format(self.iteration)) - pickle.dump(self.__getstate__(), - open(checkpoint_path + ".agent_state", "wb")) - return checkpoint_path - def _restore(self, checkpoint_path): - extra_data = pickle.load(open(checkpoint_path + ".agent_state", "rb")) - self.__setstate__(extra_data) +def _register_if_needed(env_object): + if isinstance(env_object, six.string_types): + return env_object + elif isinstance(env_object, type): + name = env_object.__name__ + register_env(name, lambda config: env_object(config)) + return name def get_agent_class(alg): @@ -389,9 +501,6 @@ def get_agent_class(alg): elif alg == "A2C": from ray.rllib.agents import a3c return a3c.A2CAgent - elif alg == "BC": - from ray.rllib.agents import bc - return bc.BCAgent elif alg == "PG": from ray.rllib.agents import pg return pg.PGAgent diff --git a/python/ray/rllib/agents/ars/ars.py b/python/ray/rllib/agents/ars/ars.py index e1a9459857716..1b39a79d0c13b 100644 --- a/python/ray/rllib/agents/ars/ars.py +++ b/python/ray/rllib/agents/ars/ars.py @@ -7,38 +7,42 @@ from __future__ import print_function from collections import namedtuple +import logging import numpy as np import time import ray from ray.rllib.agents import Agent, with_common_config -from ray.tune.trial import Resources from ray.rllib.agents.ars import optimizers from ray.rllib.agents.ars import policies -from ray.rllib.agents.es import tabular_logger as tlogger from ray.rllib.agents.ars import utils +from ray.rllib.utils.annotations import override +from ray.rllib.utils import FilterManager + +logger = logging.getLogger(__name__) Result = namedtuple("Result", [ "noise_indices", "noisy_returns", "sign_noisy_returns", "noisy_lengths", "eval_returns", "eval_lengths" ]) +# yapf: disable +# __sphinx_doc_begin__ DEFAULT_CONFIG = with_common_config({ - 'noise_stdev': 0.02, # std deviation of parameter noise - 'num_rollouts': 32, # number of perturbs to try - 'rollouts_used': 32, # number of perturbs to keep in gradient estimate - 'num_workers': 2, - 'sgd_stepsize': 0.01, # sgd step-size - 'observation_filter': "MeanStdFilter", - 'noise_size': 250000000, - 'eval_prob': 0.03, # probability of evaluating the parameter rewards - 'report_length': 10, # how many of the last rewards we average over - 'env_config': {}, - 'offset': 0, - 'policy_type': "LinearPolicy", # ["LinearPolicy", "MLPPolicy"] - "fcnet_hiddens": [32, 32], # fcnet structure of MLPPolicy + "noise_stdev": 0.02, # std deviation of parameter noise + "num_rollouts": 32, # number of perturbs to try + "rollouts_used": 32, # number of perturbs to keep in gradient estimate + "num_workers": 2, + "sgd_stepsize": 0.01, # sgd step-size + "observation_filter": "MeanStdFilter", + "noise_size": 250000000, + 
"eval_prob": 0.03, # probability of evaluating the parameter rewards + "report_length": 10, # how many of the last rewards we average over + "offset": 0, }) +# __sphinx_doc_end__ +# yapf: enable @ray.remote @@ -67,15 +71,9 @@ def get_delta(self, dim): @ray.remote class Worker(object): - def __init__(self, - config, - policy_params, - env_creator, - noise, - min_task_runtime=0.2): + def __init__(self, config, env_creator, noise, min_task_runtime=0.2): self.min_task_runtime = min_task_runtime self.config = config - self.policy_params = policy_params self.noise = SharedNoiseTable(noise) self.env = env_creator(config["env_config"]) @@ -83,15 +81,25 @@ def __init__(self, self.preprocessor = models.ModelCatalog.get_preprocessor(self.env) self.sess = utils.make_session(single_threaded=True) - if config["policy_type"] == "LinearPolicy": - self.policy = policies.LinearPolicy( - self.sess, self.env.action_space, self.preprocessor, - config["observation_filter"], **policy_params) - else: - self.policy = policies.MLPPolicy( - self.sess, self.env.action_space, self.preprocessor, - config["observation_filter"], config["fcnet_hiddens"], - **policy_params) + self.policy = policies.GenericPolicy( + self.sess, self.env.action_space, self.env.observation_space, + self.preprocessor, config["observation_filter"], config["model"]) + + @property + def filters(self): + return {"default": self.policy.get_filter()} + + def sync_filters(self, new_filters): + for k in self.filters: + self.filters[k].sync(new_filters[k]) + + def get_filters(self, flush_after=False): + return_filters = {} + for k, f in self.filters.items(): + return_filters[k] = f.as_serializable() + if flush_after: + f.clear_buffer() + return return_filters def rollout(self, timestep_limit, add_noise=False): rollout_rewards, rollout_length = policies.rollout( @@ -154,31 +162,16 @@ class ARSAgent(Agent): _agent_name = "ARS" _default_config = DEFAULT_CONFIG - @classmethod - def default_resource_request(cls, config): - cf = dict(cls._default_config, **config) - return Resources(cpu=1, gpu=0, extra_cpu=cf["num_workers"]) - + @override(Agent) def _init(self): - policy_params = {"action_noise_std": 0.0} - - # register the linear network - utils.register_linear_network() - env = self.env_creator(self.config["env_config"]) from ray.rllib import models preprocessor = models.ModelCatalog.get_preprocessor(env) self.sess = utils.make_session(single_threaded=False) - if self.config["policy_type"] == "LinearPolicy": - self.policy = policies.LinearPolicy( - self.sess, env.action_space, preprocessor, - self.config["observation_filter"], **policy_params) - else: - self.policy = policies.MLPPolicy( - self.sess, env.action_space, preprocessor, - self.config["observation_filter"], - self.config["fcnet_hiddens"], **policy_params) + self.policy = policies.GenericPolicy( + self.sess, env.action_space, env.observation_space, preprocessor, + self.config["observation_filter"], self.config["model"]) self.optimizer = optimizers.SGD(self.policy, self.config["sgd_stepsize"]) @@ -187,41 +180,22 @@ def _init(self): self.report_length = self.config["report_length"] # Create the shared noise table. - print("Creating shared noise table.") + logger.info("Creating shared noise table.") noise_id = create_shared_noise.remote(self.config["noise_size"]) self.noise = SharedNoiseTable(ray.get(noise_id)) # Create the actors. 
- print("Creating actors.") + logger.info("Creating actors.") self.workers = [ - Worker.remote(self.config, policy_params, self.env_creator, - noise_id) for _ in range(self.config["num_workers"]) + Worker.remote(self.config, self.env_creator, noise_id) + for _ in range(self.config["num_workers"]) ] self.episodes_so_far = 0 self.reward_list = [] self.tstart = time.time() - def _collect_results(self, theta_id, min_episodes): - num_episodes, num_timesteps = 0, 0 - results = [] - while num_episodes < min_episodes: - print("Collected {} episodes {} timesteps so far this iter".format( - num_episodes, num_timesteps)) - rollout_ids = [ - worker.do_rollouts.remote(theta_id) for worker in self.workers - ] - # Get the results of the rollouts. - for result in ray.get(rollout_ids): - results.append(result) - # Update the number of episodes and the number of timesteps - # keeping in mind that result.noisy_lengths is a list of lists, - # where the inner lists have length 2. - num_episodes += sum(len(pair) for pair in result.noisy_lengths) - num_timesteps += sum( - sum(pair) for pair in result.noisy_lengths) - return results, num_episodes, num_timesteps - + @override(Agent) def _train(self): config = self.config @@ -287,7 +261,6 @@ def _train(self): g /= np.std(noisy_returns) assert (g.shape == (self.policy.num_params, ) and g.dtype == np.float32) - print('the number of policy params is, ', self.policy.num_params) # Compute the new weights theta. theta, update_ratio = self.optimizer.update(-g) # Set the new weights in the local copy of the policy. @@ -296,18 +269,14 @@ def _train(self): if len(all_eval_returns) > 0: self.reward_list.append(eval_returns.mean()) - tlogger.record_tabular("NoisyEpRewMean", noisy_returns.mean()) - tlogger.record_tabular("NoisyEpRewStd", noisy_returns.std()) - tlogger.record_tabular("NoisyEpLenMean", noisy_lengths.mean()) - - tlogger.record_tabular("WeightsNorm", float(np.square(theta).sum())) - tlogger.record_tabular("WeightsStd", float(np.std(theta))) - tlogger.record_tabular("Grad2Norm", float(np.sqrt(np.square(g).sum()))) - tlogger.record_tabular("UpdateRatio", float(update_ratio)) - tlogger.dump_tabular() + # Now sync the filters + FilterManager.synchronize({ + "default": self.policy.get_filter() + }, self.workers) info = { "weights_norm": np.square(theta).sum(), + "weights_std": np.std(theta), "grad_norm": np.square(g).sum(), "update_ratio": update_ratio, "episodes_this_iter": noisy_lengths.size, @@ -322,20 +291,49 @@ def _train(self): return result + @override(Agent) def _stop(self): # workaround for https://github.com/ray-project/ray/issues/1516 for w in self.workers: w.__ray_terminate__.remote() + @override(Agent) + def compute_action(self, observation): + return self.policy.compute(observation, update=True)[0] + + def _collect_results(self, theta_id, min_episodes): + num_episodes, num_timesteps = 0, 0 + results = [] + while num_episodes < min_episodes: + logger.info( + "Collected {} episodes {} timesteps so far this iter".format( + num_episodes, num_timesteps)) + rollout_ids = [ + worker.do_rollouts.remote(theta_id) for worker in self.workers + ] + # Get the results of the rollouts. + for result in ray.get(rollout_ids): + results.append(result) + # Update the number of episodes and the number of timesteps + # keeping in mind that result.noisy_lengths is a list of lists, + # where the inner lists have length 2. 
+ num_episodes += sum(len(pair) for pair in result.noisy_lengths) + num_timesteps += sum( + sum(pair) for pair in result.noisy_lengths) + + return results, num_episodes, num_timesteps + def __getstate__(self): return { "weights": self.policy.get_weights(), + "filter": self.policy.get_filter(), "episodes_so_far": self.episodes_so_far, } def __setstate__(self, state): - self.policy.set_weights(state["weights"]) self.episodes_so_far = state["episodes_so_far"] - - def compute_action(self, observation): - return self.policy.compute(observation, update=True)[0] + self.policy.set_weights(state["weights"]) + self.policy.set_filter(state["filter"]) + FilterManager.synchronize({ + "default": self.policy.get_filter() + }, self.workers) diff --git a/python/ray/rllib/agents/ars/policies.py b/python/ray/rllib/agents/ars/policies.py index 3a25d68eb6b3e..27f664655f423 100644 --- a/python/ray/rllib/agents/ars/policies.py +++ b/python/ray/rllib/agents/ars/policies.py @@ -10,8 +10,8 @@ import tensorflow as tf import ray +from ray.rllib.evaluation.sampler import _unbatch_tuple_actions from ray.rllib.utils.filter import get_filter -from ray.rllib.utils.error import UnsupportedSpaceException from ray.rllib.models import ModelCatalog @@ -57,16 +57,11 @@ class GenericPolicy(object): def __init__(self, sess, action_space, + obs_space, preprocessor, observation_filter, - action_noise_std, - options={}): - - if len(preprocessor.shape) > 1: - raise UnsupportedSpaceException( - "Observation space {} is not supported with ARS.".format( - preprocessor.shape)) - + model_config, + action_noise_std=0.0): self.sess = sess self.action_space = action_space self.action_noise_std = action_noise_std @@ -78,9 +73,11 @@ def __init__(self, # Policy network. dist_class, dist_dim = ModelCatalog.get_action_dist( - action_space, dist_type="deterministic") + action_space, model_config, dist_type="deterministic") - model = ModelCatalog.get_model(self.inputs, dist_dim, options=options) + model = ModelCatalog.get_model({ + "obs": self.inputs + }, obs_space, dist_dim, model_config) dist = dist_class(model.outputs) self.sampler = dist.sample() @@ -97,6 +94,7 @@ def compute(self, observation, add_noise=False, update=True): observation = self.observation_filter(observation[None], update=update) action = self.sess.run( self.sampler, feed_dict={self.inputs: observation}) + action = _unbatch_tuple_actions(action) if add_noise and isinstance(self.action_space, gym.spaces.Box): action += np.random.randn(*action.shape) * self.action_noise_std return action @@ -104,33 +102,11 @@ def compute(self, observation, add_noise=False, update=True): def set_weights(self, x): self.variables.set_flat(x) - def get_weights(self): - return self.variables.get_flat() + def set_filter(self, obs_filter): + self.observation_filter = obs_filter + def get_filter(self): + return self.observation_filter -class LinearPolicy(GenericPolicy): - def __init__(self, sess, action_space, preprocessor, observation_filter, - action_noise_std): - options = {"custom_model": "LinearNetwork"} - GenericPolicy.__init__( - self, - sess, - action_space, - preprocessor, - observation_filter, - action_noise_std, - options=options) - - -class MLPPolicy(GenericPolicy): - def __init__(self, sess, action_space, preprocessor, observation_filter, - fcnet_hiddens, action_noise_std): - options = {"fcnet_hiddens": fcnet_hiddens} - GenericPolicy.__init__( - self, - sess, - action_space, - preprocessor, - observation_filter, - action_noise_std, - options=options) + def get_weights(self): + return 
self.variables.get_flat() diff --git a/python/ray/rllib/agents/ars/utils.py b/python/ray/rllib/agents/ars/utils.py index a70dd97bb61a3..1575e46c38370 100644 --- a/python/ray/rllib/agents/ars/utils.py +++ b/python/ray/rllib/agents/ars/utils.py @@ -7,9 +7,6 @@ import numpy as np import tensorflow as tf -from ray.rllib.models import ModelCatalog, Model -import tensorflow.contrib.slim as slim -from ray.rllib.models.misc import normc_initializer def compute_ranks(x): @@ -62,21 +59,3 @@ def batched_weighted_sum(weights, vecs, batch_size): np.asarray(batch_vecs, dtype=np.float32)) num_items_summed += len(batch_weights) return total, num_items_summed - - -class LinearNetwork(Model): - """Generic linear network.""" - - def _build_layers(self, inputs, num_outputs, _): - with tf.name_scope("linear"): - output = slim.fully_connected( - inputs, - num_outputs, - weights_initializer=normc_initializer(0.01), - activation_fn=None, - ) - return output, inputs - - -def register_linear_network(): - ModelCatalog.register_custom_model("LinearNetwork", LinearNetwork) diff --git a/python/ray/rllib/agents/bc/__init__.py b/python/ray/rllib/agents/bc/__init__.py deleted file mode 100644 index eb0f8dc2d7dd3..0000000000000 --- a/python/ray/rllib/agents/bc/__init__.py +++ /dev/null @@ -1,3 +0,0 @@ -from ray.rllib.agents.bc.bc import BCAgent, DEFAULT_CONFIG - -__all__ = ["BCAgent", "DEFAULT_CONFIG"] diff --git a/python/ray/rllib/agents/bc/bc.py b/python/ray/rllib/agents/bc/bc.py deleted file mode 100644 index b2552bf990f56..0000000000000 --- a/python/ray/rllib/agents/bc/bc.py +++ /dev/null @@ -1,99 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import ray -from ray.rllib.agents.agent import Agent -from ray.rllib.agents.bc.bc_evaluator import BCEvaluator, \ - GPURemoteBCEvaluator, RemoteBCEvaluator -from ray.rllib.optimizers import AsyncGradientsOptimizer -from ray.rllib.utils import merge_dicts -from ray.tune.trial import Resources - -DEFAULT_CONFIG = { - # Number of workers (excluding master) - "num_workers": 1, - # Size of rollout batch - "batch_size": 100, - # Max global norm for each gradient calculated by worker - "grad_clip": 40.0, - # Learning rate - "lr": 0.0001, - # Whether to use a GPU for local optimization. 
- "gpu": False, - # Whether to place workers on GPUs - "use_gpu_for_workers": False, - # Model and preprocessor options - "model": { - # (Image statespace) - Converts image to Channels = 1 - "grayscale": True, - # (Image statespace) - Each pixel - "zero_mean": False, - # (Image statespace) - Converts image to (dim, dim, C) - "dim": 84, - # (Image statespace) - Converts image shape to (C, dim, dim) - "channel_major": False - }, - # Arguments to pass to the rllib optimizer - "optimizer": { - # Number of gradients applied for each `train` step - "grads_per_step": 100, - }, - # Arguments to pass to the env creator - "env_config": {}, -} - - -class BCAgent(Agent): - _agent_name = "BC" - _default_config = DEFAULT_CONFIG - _allow_unknown_configs = True - - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - if cf["use_gpu_for_workers"]: - num_gpus_per_worker = cf["gpu_fraction"] - else: - num_gpus_per_worker = 0 - return Resources( - cpu=1, - gpu=cf["gpu"] and cf["gpu_fraction"] or 0, - extra_cpu=cf["num_workers"], - extra_gpu=num_gpus_per_worker * cf["num_workers"]) - - def _init(self): - self.local_evaluator = BCEvaluator(self.env_creator, self.config, - self.logdir) - if self.config["use_gpu_for_workers"]: - remote_cls = GPURemoteBCEvaluator - else: - remote_cls = RemoteBCEvaluator - self.remote_evaluators = [ - remote_cls.remote(self.env_creator, self.config, self.logdir) - for _ in range(self.config["num_workers"]) - ] - self.optimizer = AsyncGradientsOptimizer(self.local_evaluator, - self.remote_evaluators, - self.config["optimizer"]) - - def _train(self): - self.optimizer.step() - metric_lists = [ - re.get_metrics.remote() for re in self.remote_evaluators - ] - total_samples = 0 - total_loss = 0 - for metrics in metric_lists: - for m in ray.get(metrics): - total_samples += m["num_samples"] - total_loss += m["loss"] - result = dict( - mean_loss=total_loss / total_samples, - timesteps_this_iter=total_samples, - ) - return result - - def compute_action(self, observation): - action, info = self.local_evaluator.policy.compute(observation) - return action diff --git a/python/ray/rllib/agents/bc/bc_evaluator.py b/python/ray/rllib/agents/bc/bc_evaluator.py deleted file mode 100644 index 4726b4a3cf176..0000000000000 --- a/python/ray/rllib/agents/bc/bc_evaluator.py +++ /dev/null @@ -1,64 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import pickle -from six.moves import queue - -import ray -from ray.rllib.agents.bc.experience_dataset import ExperienceDataset -from ray.rllib.agents.bc.policy import BCPolicy -from ray.rllib.evaluation.interface import EvaluatorInterface -from ray.rllib.models import ModelCatalog - - -class BCEvaluator(EvaluatorInterface): - def __init__(self, env_creator, config, logdir): - env = ModelCatalog.get_preprocessor_as_wrapper( - env_creator(config["env_config"]), config["model"]) - self.dataset = ExperienceDataset(config["dataset_path"]) - self.policy = BCPolicy(env.observation_space, env.action_space, config) - self.config = config - self.logdir = logdir - self.metrics_queue = queue.Queue() - - def sample(self): - return self.dataset.sample(self.config["batch_size"]) - - def compute_gradients(self, samples): - gradient, info = self.policy.compute_gradients(samples) - self.metrics_queue.put({ - "num_samples": info["num_samples"], - "loss": info["loss"] - }) - return gradient, {} - - def apply_gradients(self, grads): - 
self.policy.apply_gradients(grads) - - def get_weights(self): - return self.policy.get_weights() - - def set_weights(self, params): - self.policy.set_weights(params) - - def save(self): - weights = self.get_weights() - return pickle.dumps({"weights": weights}) - - def restore(self, objs): - objs = pickle.loads(objs) - self.set_weights(objs["weights"]) - - def get_metrics(self): - completed = [] - while True: - try: - completed.append(self.metrics_queue.get_nowait()) - except queue.Empty: - break - return completed - - -RemoteBCEvaluator = ray.remote(BCEvaluator) -GPURemoteBCEvaluator = ray.remote(num_gpus=1)(BCEvaluator) diff --git a/python/ray/rllib/agents/bc/experience_dataset.py b/python/ray/rllib/agents/bc/experience_dataset.py deleted file mode 100644 index d082841842698..0000000000000 --- a/python/ray/rllib/agents/bc/experience_dataset.py +++ /dev/null @@ -1,34 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import itertools -import pickle - -import numpy as np - - -class ExperienceDataset(object): - def __init__(self, dataset_path): - """Create dataset of experience to imitate. - - Parameters - ---------- - dataset_path: - Path of file containing the database as pickled list of trajectories, - each trajectory being a list of steps, - each step containing the observation and action as its first two - elements. - The file must be available on each machine used by a BCEvaluator. - """ - self._dataset = list( - itertools.chain.from_iterable( - pickle.load(open(dataset_path, "rb")))) - - def sample(self, batch_size): - indexes = np.random.choice(len(self._dataset), batch_size) - samples = { - 'observations': [self._dataset[i][0] for i in indexes], - 'actions': [self._dataset[i][1] for i in indexes] - } - return samples diff --git a/python/ray/rllib/agents/bc/policy.py b/python/ray/rllib/agents/bc/policy.py deleted file mode 100644 index a504e3ec64ff8..0000000000000 --- a/python/ray/rllib/agents/bc/policy.py +++ /dev/null @@ -1,106 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import tensorflow as tf -import gym - -import ray -from ray.rllib.models.catalog import ModelCatalog - - -class BCPolicy(object): - def __init__(self, obs_space, action_space, config): - self.local_steps = 0 - self.config = config - self.summarize = config.get("summarize") - self._setup_graph(obs_space, action_space) - self.setup_loss(action_space) - self.setup_gradients() - self.initialize() - - def _setup_graph(self, obs_space, ac_space): - self.x = tf.placeholder(tf.float32, [None] + list(obs_space.shape)) - dist_class, self.logit_dim = ModelCatalog.get_action_dist( - ac_space, self.config["model"]) - self._model = ModelCatalog.get_model(self.x, self.logit_dim, - self.config["model"]) - self.logits = self._model.outputs - self.curr_dist = dist_class(self.logits) - self.sample = self.curr_dist.sample() - self.var_list = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES, - tf.get_variable_scope().name) - - def setup_loss(self, action_space): - if isinstance(action_space, gym.spaces.Box): - self.ac = tf.placeholder( - tf.float32, [None] + list(action_space.shape), name="ac") - elif isinstance(action_space, gym.spaces.Discrete): - self.ac = tf.placeholder(tf.int64, [None], name="ac") - else: - raise NotImplementedError("action space" + - str(type(action_space)) + - "currently not supported") - log_prob = self.curr_dist.logp(self.ac) - self.pi_loss = 
-tf.reduce_sum(log_prob) - self.loss = self.pi_loss - - def setup_gradients(self): - grads = tf.gradients(self.loss, self.var_list) - self.grads, _ = tf.clip_by_global_norm(grads, self.config["grad_clip"]) - grads_and_vars = list(zip(self.grads, self.var_list)) - opt = tf.train.AdamOptimizer(self.config["lr"]) - self._apply_gradients = opt.apply_gradients(grads_and_vars) - - def initialize(self): - if self.summarize: - bs = tf.to_float(tf.shape(self.x)[0]) - tf.summary.scalar("model/policy_loss", self.pi_loss / bs) - tf.summary.scalar("model/grad_gnorm", tf.global_norm(self.grads)) - tf.summary.scalar("model/var_gnorm", tf.global_norm(self.var_list)) - self.summary_op = tf.summary.merge_all() - - # TODO(rliaw): Can consider exposing these parameters - self.sess = tf.Session( - graph=self.g, - config=tf.ConfigProto( - intra_op_parallelism_threads=1, - inter_op_parallelism_threads=2, - gpu_options=tf.GPUOptions(allow_growth=True))) - self.variables = ray.experimental.TensorFlowVariables( - self.loss, self.sess) - self.sess.run(tf.global_variables_initializer()) - - def compute_gradients(self, samples): - info = {} - feed_dict = { - self.x: samples["observations"], - self.ac: samples["actions"] - } - self.grads = [g for g in self.grads if g is not None] - self.local_steps += 1 - if self.summarize: - loss, grad, summ = self.sess.run( - [self.loss, self.grads, self.summary_op], feed_dict=feed_dict) - info["summary"] = summ - else: - loss, grad = self.sess.run( - [self.loss, self.grads], feed_dict=feed_dict) - info["num_samples"] = len(samples) - info["loss"] = loss - return grad, info - - def apply_gradients(self, grads): - feed_dict = {self.grads[i]: grads[i] for i in range(len(grads))} - self.sess.run(self._apply_gradients, feed_dict=feed_dict) - - def get_weights(self): - weights = self.variables.get_weights() - return weights - - def set_weights(self, weights): - self.variables.set_weights(weights) - - def compute(self, ob, *args): - action = self.sess.run(self.sample, {self.x: [ob]}) - return action, None diff --git a/python/ray/rllib/agents/ddpg/apex.py b/python/ray/rllib/agents/ddpg/apex.py index c2276d0a9a556..6b3465013da36 100644 --- a/python/ray/rllib/agents/ddpg/apex.py +++ b/python/ray/rllib/agents/ddpg/apex.py @@ -3,11 +3,11 @@ from __future__ import print_function from ray.rllib.agents.ddpg.ddpg import DDPGAgent, DEFAULT_CONFIG as DDPG_CONFIG +from ray.rllib.utils.annotations import override from ray.rllib.utils import merge_dicts -from ray.tune.trial import Resources APEX_DDPG_DEFAULT_CONFIG = merge_dicts( - DDPG_CONFIG, + DDPG_CONFIG, # see also the options in ddpg.py, which are also supported { "optimizer_class": "AsyncReplayOptimizer", "optimizer": merge_dicts( @@ -17,7 +17,7 @@ "debug": False }), "n_step": 3, - "gpu": False, + "num_gpus": 0, "num_workers": 32, "buffer_size": 2000000, "learning_starts": 50000, @@ -43,15 +43,7 @@ class ApexDDPGAgent(DDPGAgent): _agent_name = "APEX_DDPG" _default_config = APEX_DDPG_DEFAULT_CONFIG - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - return Resources( - cpu=1 + cf["optimizer"]["num_replay_buffer_shards"], - gpu=cf["gpu"] and cf["gpu_fraction"] or 0, - extra_cpu=cf["num_cpus_per_worker"] * cf["num_workers"], - extra_gpu=cf["num_gpus_per_worker"] * cf["num_workers"]) - + @override(DDPGAgent) def update_target_if_needed(self): # Ape-X updates based on num steps trained, not sampled if self.optimizer.num_steps_trained - self.last_target_update_ts > \ diff --git 
a/python/ray/rllib/agents/ddpg/ddpg.py b/python/ray/rllib/agents/ddpg/ddpg.py index b475e297a2472..ca0e8087f4644 100644 --- a/python/ray/rllib/agents/ddpg/ddpg.py +++ b/python/ray/rllib/agents/ddpg/ddpg.py @@ -5,6 +5,7 @@ from ray.rllib.agents.agent import with_common_config from ray.rllib.agents.dqn.dqn import DQNAgent from ray.rllib.agents.ddpg.ddpg_policy_graph import DDPGPolicyGraph +from ray.rllib.utils.annotations import override from ray.rllib.utils.schedules import ConstantSchedule, LinearSchedule OPTIMIZER_SHARED_CONFIGS = [ @@ -13,7 +14,25 @@ "train_batch_size", "learning_starts" ] +# yapf: disable +# __sphinx_doc_begin__ DEFAULT_CONFIG = with_common_config({ + # === Twin Delayed DDPG (TD3) and Soft Actor-Critic (SAC) tricks === + # TD3: https://spinningup.openai.com/en/latest/algorithms/td3.html + # twin Q-net + "twin_q": False, + # delayed policy update + "policy_delay": 1, + # target policy smoothing + # this also forces the use of gaussian instead of OU noise for exploration + "smooth_target_policy": False, + # gaussian stddev of act noise + "act_noise": 0.1, + # gaussian stddev of target noise + "target_noise": 0.2, + # target noise limit (bound) + "noise_clip": 0.5, + # === Model === # Hidden layer sizes of the policy network "actor_hiddens": [64, 64], @@ -65,9 +84,11 @@ "compress_observations": False, # === Optimization === - # Learning rate for adam optimizer - "actor_lr": 1e-4, - "critic_lr": 1e-3, + # Learning rate for adam optimizer. + # Instead of using two optimizers, we use two different loss coefficients + "lr": 1e-3, + "actor_loss_coeff": 0.1, + "critic_loss_coeff": 1.0, # If True, use huber loss instead of squared loss for critic network # Conventionally, no need to clip gradients if using a huber loss "use_huber": False, @@ -88,16 +109,10 @@ "train_batch_size": 256, # === Parallelism === - # Whether to use a GPU for local optimization. - "gpu": False, # Number of workers for collecting samples with. This only makes sense # to increase if your environment is particularly slow to sample, or if # you"re using the Async or Ape-X optimizers. "num_workers": 0, - # Whether to allocate GPUs for workers (if > 0). - "num_gpus_per_worker": 0, - # Whether to allocate CPUs for workers (if > 0). - "num_cpus_per_worker": 1, # Optimizer class to use. "optimizer_class": "SyncReplayOptimizer", # Whether to use a distribution of epsilons across workers for exploration. 
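# Note: illustration only, not part of the patch. The "smooth_target_policy",
# "target_noise" and "noise_clip" options above implement TD3-style target
# policy smoothing; a minimal numpy sketch of the idea for a Box action
# space with bounds [low, high]:
import numpy as np

def smoothed_target_action(target_action, low, high,
                           target_noise=0.2, noise_clip=0.5):
    # Perturb the target action with clipped Gaussian noise, then clip the
    # result back into the valid action range.
    noise = np.clip(
        np.random.normal(0.0, target_noise, target_action.shape),
        -noise_clip, noise_clip)
    return np.clip(target_action + noise, low, high)

# e.g. smoothed_target_action(np.array([0.3, -0.9]), low=-1.0, high=1.0)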
@@ -107,6 +122,8 @@ # Prevent iterations from going lower than this time span "min_iter_time_s": 1, }) +# __sphinx_doc_end__ +# yapf: enable class DDPGAgent(DQNAgent): @@ -115,14 +132,22 @@ class DDPGAgent(DQNAgent): _default_config = DEFAULT_CONFIG _policy_graph = DDPGPolicyGraph + @override(DQNAgent) def _make_exploration_schedule(self, worker_index): # Override DQN's schedule to take into account `noise_scale` if self.config["per_worker_exploration"]: assert self.config["num_workers"] > 1, \ "This requires multiple workers" - exponent = ( - 1 + worker_index / float(self.config["num_workers"] - 1) * 7) - return ConstantSchedule(self.config["noise_scale"] * 0.4**exponent) + if worker_index >= 0: + exponent = ( + 1 + + worker_index / float(self.config["num_workers"] - 1) * 7) + return ConstantSchedule( + self.config["noise_scale"] * 0.4**exponent) + else: + # local ev should have zero exploration so that eval rollouts + # run properly + return ConstantSchedule(0.0) else: return LinearSchedule( schedule_timesteps=int(self.config["exploration_fraction"] * diff --git a/python/ray/rllib/agents/ddpg/ddpg_policy_graph.py b/python/ray/rllib/agents/ddpg/ddpg_policy_graph.py index a6f26885fe308..b8b625734793d 100644 --- a/python/ray/rllib/agents/ddpg/ddpg_policy_graph.py +++ b/python/ray/rllib/agents/ddpg/ddpg_policy_graph.py @@ -11,7 +11,9 @@ from ray.rllib.agents.dqn.dqn_policy_graph import _huber_loss, \ _minimize_and_clip, _scope_vars, _postprocess_dqn from ray.rllib.models import ModelCatalog +from ray.rllib.utils.annotations import override from ray.rllib.utils.error import UnsupportedSpaceException +from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph A_SCOPE = "a_func" @@ -19,6 +21,8 @@ P_TARGET_SCOPE = "target_p_func" Q_SCOPE = "q_func" Q_TARGET_SCOPE = "target_q_func" +TWIN_Q_SCOPE = "twin_q_func" +TWIN_Q_TARGET_SCOPE = "twin_target_q_func" class PNetwork(object): @@ -50,24 +54,47 @@ def __init__(self, stochastic, eps, theta=0.15, - sigma=0.2): + sigma=0.2, + use_gaussian_noise=False, + act_noise=0.1, + is_target=False, + target_noise=0.2, + noise_clip=0.5): # shape is [None, dim_action] deterministic_actions = ( (high_action - low_action) * p_values + low_action) - exploration_sample = tf.get_variable( - name="ornstein_uhlenbeck", - dtype=tf.float32, - initializer=low_action.size * [.0], - trainable=False) - normal_sample = tf.random_normal( - shape=[low_action.size], mean=0.0, stddev=1.0) - exploration_value = tf.assign_add( - exploration_sample, - theta * (.0 - exploration_sample) + sigma * normal_sample) - stochastic_actions = deterministic_actions + eps * ( - high_action - low_action) * exploration_value + if use_gaussian_noise: + if is_target: + normal_sample = tf.random_normal( + tf.shape(deterministic_actions), stddev=target_noise) + normal_sample = tf.clip_by_value(normal_sample, -noise_clip, + noise_clip) + stochastic_actions = tf.clip_by_value( + deterministic_actions + normal_sample, low_action, + high_action) + else: + normal_sample = tf.random_normal( + tf.shape(deterministic_actions), stddev=act_noise) + stochastic_actions = tf.clip_by_value( + deterministic_actions + normal_sample, low_action, + high_action) + else: + exploration_sample = tf.get_variable( + name="ornstein_uhlenbeck", + dtype=tf.float32, + initializer=low_action.size * [.0], + trainable=False) + normal_sample = tf.random_normal( + shape=[low_action.size], mean=0.0, stddev=1.0) + exploration_value = tf.assign_add( + exploration_sample, + 
theta * (.0 - exploration_sample) + sigma * normal_sample)
+            stochastic_actions = tf.clip_by_value(
+                deterministic_actions +
+                eps * (high_action - low_action) * exploration_value,
+                low_action, high_action)

         self.actions = tf.cond(stochastic, lambda: stochastic_actions,
                                lambda: deterministic_actions)
@@ -86,6 +113,7 @@ def __init__(self,
             q_out, num_outputs=hidden, activation_fn=activation)
         self.value = layers.fully_connected(
             q_out, num_outputs=1, activation_fn=None)
+        self.model = model


 class ActorCriticLoss(object):
@@ -96,12 +124,21 @@ def __init__(self,
                  importance_weights,
                  rewards,
                  done_mask,
+                 twin_q_t,
+                 twin_q_tp1,
+                 actor_loss_coeff=0.1,
+                 critic_loss_coeff=1.0,
                  gamma=0.99,
                  n_step=1,
                  use_huber=False,
-                 huber_threshold=1.0):
+                 huber_threshold=1.0,
+                 twin_q=False,
+                 policy_delay=1):

         q_t_selected = tf.squeeze(q_t, axis=len(q_t.shape) - 1)
+        if twin_q:
+            twin_q_t_selected = tf.squeeze(twin_q_t, axis=len(q_t.shape) - 1)
+            q_tp1 = tf.minimum(q_tp1, twin_q_tp1)

         q_tp1_best = tf.squeeze(input=q_tp1, axis=len(q_tp1.shape) - 1)
         q_tp1_best_masked = (1.0 - done_mask) * q_tp1_best
@@ -110,16 +147,36 @@ def __init__(self,
         q_t_selected_target = rewards + gamma**n_step * q_tp1_best_masked

         # compute the error (potentially clipped)
-        self.td_error = q_t_selected - tf.stop_gradient(q_t_selected_target)
-        if use_huber:
-            errors = _huber_loss(self.td_error, huber_threshold)
+        if twin_q:
+            td_error = q_t_selected - tf.stop_gradient(q_t_selected_target)
+            twin_td_error = twin_q_t_selected - tf.stop_gradient(
+                q_t_selected_target)
+            self.td_error = td_error + twin_td_error
+            if use_huber:
+                errors = _huber_loss(td_error, huber_threshold) + _huber_loss(
+                    twin_td_error, huber_threshold)
+            else:
+                errors = 0.5 * tf.square(td_error) + 0.5 * tf.square(
+                    twin_td_error)
         else:
-            errors = 0.5 * tf.square(self.td_error)
-
-        self.critic_loss = tf.reduce_mean(importance_weights * errors)
+            self.td_error = (
+                q_t_selected - tf.stop_gradient(q_t_selected_target))
+            if use_huber:
+                errors = _huber_loss(self.td_error, huber_threshold)
+            else:
+                errors = 0.5 * tf.square(self.td_error)
+
+        self.critic_loss = critic_loss_coeff * tf.reduce_mean(
+            importance_weights * errors)
+
+        # for policy gradient, update policy net one time vs. 
+ # update critic net `policy_delay` time(s) + global_step = tf.train.get_or_create_global_step() + policy_delay_mask = tf.to_float( + tf.equal(tf.mod(global_step, policy_delay), 0)) + self.actor_loss = (-1.0 * actor_loss_coeff * policy_delay_mask * + tf.reduce_mean(q_tp0)) - # for policy gradient - self.actor_loss = -1.0 * tf.reduce_mean(q_tp0) self.total_loss = self.actor_loss + self.critic_loss @@ -136,20 +193,22 @@ def __init__(self, observation_space, action_space, config): self.dim_actions = action_space.shape[0] self.low_action = action_space.low self.high_action = action_space.high - self.actor_optimizer = tf.train.AdamOptimizer( - learning_rate=config["actor_lr"]) - self.critic_optimizer = tf.train.AdamOptimizer( - learning_rate=config["critic_lr"]) + + # create global step for counting the number of update operations + self.global_step = tf.train.get_or_create_global_step() # Action inputs self.stochastic = tf.placeholder(tf.bool, (), name="stochastic") self.eps = tf.placeholder(tf.float32, (), name="eps") self.cur_observations = tf.placeholder( - tf.float32, shape=(None, ) + observation_space.shape) + tf.float32, + shape=(None, ) + observation_space.shape, + name="cur_obs") # Actor: P (policy) network with tf.variable_scope(P_SCOPE) as scope: - p_values = self._build_p_network(self.cur_observations) + p_values = self._build_p_network(self.cur_observations, + observation_space) self.p_func_vars = _scope_vars(scope.name) # Action outputs @@ -157,10 +216,13 @@ def __init__(self, observation_space, action_space, config): self.output_actions = self._build_action_network( p_values, self.stochastic, self.eps) - with tf.variable_scope(A_SCOPE, reuse=True): - exploration_sample = tf.get_variable(name="ornstein_uhlenbeck") - self.reset_noise_op = tf.assign(exploration_sample, - self.dim_actions * [.0]) + if self.config["smooth_target_policy"]: + self.reset_noise_op = tf.no_op() + else: + with tf.variable_scope(A_SCOPE, reuse=True): + exploration_sample = tf.get_variable(name="ornstein_uhlenbeck") + self.reset_noise_op = tf.assign(exploration_sample, + self.dim_actions * [.0]) # Replay inputs self.obs_t = tf.placeholder( @@ -178,37 +240,63 @@ def __init__(self, observation_space, action_space, config): # p network evaluation with tf.variable_scope(P_SCOPE, reuse=True) as scope: - self.p_t = self._build_p_network(self.obs_t) + prev_update_ops = set(tf.get_collection(tf.GraphKeys.UPDATE_OPS)) + self.p_t = self._build_p_network(self.obs_t, observation_space) + p_batchnorm_update_ops = list( + set(tf.get_collection(tf.GraphKeys.UPDATE_OPS)) - + prev_update_ops) # target p network evaluation with tf.variable_scope(P_TARGET_SCOPE) as scope: - p_tp1 = self._build_p_network(self.obs_tp1) + p_tp1 = self._build_p_network(self.obs_tp1, observation_space) target_p_func_vars = _scope_vars(scope.name) # Action outputs with tf.variable_scope(A_SCOPE, reuse=True): - deterministic_flag = tf.constant(value=False, dtype=tf.bool) - zero_eps = tf.constant(value=.0, dtype=tf.float32) output_actions = self._build_action_network( - self.p_t, deterministic_flag, zero_eps) - + self.p_t, + stochastic=tf.constant(value=False, dtype=tf.bool), + eps=.0) output_actions_estimated = self._build_action_network( - p_tp1, deterministic_flag, zero_eps) + p_tp1, + stochastic=tf.constant( + value=self.config["smooth_target_policy"], dtype=tf.bool), + eps=.0, + is_target=True) # q network evaluation + prev_update_ops = set(tf.get_collection(tf.GraphKeys.UPDATE_OPS)) with tf.variable_scope(Q_SCOPE) as scope: - q_t = 
self._build_q_network(self.obs_t, self.act_t) + q_t, model = self._build_q_network(self.obs_t, observation_space, + self.act_t) self.q_func_vars = _scope_vars(scope.name) with tf.variable_scope(Q_SCOPE, reuse=True): - q_tp0 = self._build_q_network(self.obs_t, output_actions) + q_tp0, _ = self._build_q_network(self.obs_t, observation_space, + output_actions) + if self.config["twin_q"]: + with tf.variable_scope(TWIN_Q_SCOPE) as scope: + twin_q_t, twin_model = self._build_q_network( + self.obs_t, observation_space, self.act_t) + self.twin_q_func_vars = _scope_vars(scope.name) + q_batchnorm_update_ops = list( + set(tf.get_collection(tf.GraphKeys.UPDATE_OPS)) - prev_update_ops) # target q network evalution with tf.variable_scope(Q_TARGET_SCOPE) as scope: - q_tp1 = self._build_q_network(self.obs_tp1, - output_actions_estimated) + q_tp1, _ = self._build_q_network(self.obs_tp1, observation_space, + output_actions_estimated) target_q_func_vars = _scope_vars(scope.name) - - self.loss = self._build_actor_critic_loss(q_t, q_tp1, q_tp0) + if self.config["twin_q"]: + with tf.variable_scope(TWIN_Q_TARGET_SCOPE) as scope: + twin_q_tp1, _ = self._build_q_network( + self.obs_tp1, observation_space, output_actions_estimated) + twin_target_q_func_vars = _scope_vars(scope.name) + + if self.config["twin_q"]: + self.loss = self._build_actor_critic_loss( + q_t, q_tp1, q_tp0, twin_q_t=twin_q_t, twin_q_tp1=twin_q_tp1) + else: + self.loss = self._build_actor_critic_loss(q_t, q_tp1, q_tp0) if config["l2_reg"] is not None: for var in self.p_func_vars: @@ -219,6 +307,11 @@ def __init__(self, observation_space, action_space, config): if "bias" not in var.name: self.loss.critic_loss += ( config["l2_reg"] * 0.5 * tf.nn.l2_loss(var)) + if self.config["twin_q"]: + for var in self.twin_q_func_vars: + if "bias" not in var.name: + self.loss.critic_loss += ( + config["l2_reg"] * 0.5 * tf.nn.l2_loss(var)) # update_target_fn will be called periodically to copy Q network to # target Q network @@ -231,6 +324,13 @@ def __init__(self, observation_space, action_space, config): update_target_expr.append( var_target.assign(self.tau * var + (1.0 - self.tau) * var_target)) + if self.config["twin_q"]: + for var, var_target in zip( + sorted(self.twin_q_func_vars, key=lambda v: v.name), + sorted(twin_target_q_func_vars, key=lambda v: v.name)): + update_target_expr.append( + var_target.assign(self.tau * var + + (1.0 - self.tau) * var_target)) for var, var_target in zip( sorted(self.p_func_vars, key=lambda v: v.name), sorted(target_p_func_vars, key=lambda v: v.name)): @@ -255,8 +355,9 @@ def __init__(self, observation_space, action_space, config): self.sess, obs_input=self.cur_observations, action_sampler=self.output_actions, - loss=self.loss.total_loss, - loss_inputs=self.loss_inputs) + loss=model.loss() + self.loss.total_loss, + loss_inputs=self.loss_inputs, + update_ops=q_batchnorm_update_ops + p_batchnorm_update_ops) self.sess.run(tf.global_variables_initializer()) # Note that this encompasses both the policy and Q-value networks and @@ -267,46 +368,31 @@ def __init__(self, observation_space, action_space, config): # Hard initial update self.update_target(tau=1.0) - def _build_q_network(self, obs, actions): - return QNetwork( - ModelCatalog.get_model(obs, 1, self.config["model"]), actions, - self.config["critic_hiddens"], - self.config["critic_hidden_activation"]).value - - def _build_p_network(self, obs): - return PNetwork( - ModelCatalog.get_model(obs, 1, self.config["model"]), - self.dim_actions, self.config["actor_hiddens"], - 
self.config["actor_hidden_activation"]).action_scores - - def _build_action_network(self, p_values, stochastic, eps): - return ActionNetwork(p_values, self.low_action, self.high_action, - stochastic, eps, self.config["exploration_theta"], - self.config["exploration_sigma"]).actions - - def _build_actor_critic_loss(self, q_t, q_tp1, q_tp0): - return ActorCriticLoss( - q_t, q_tp1, q_tp0, self.importance_weights, self.rew_t, - self.done_mask, self.config["gamma"], self.config["n_step"], - self.config["use_huber"], self.config["huber_threshold"]) + @override(TFPolicyGraph) + def optimizer(self): + return tf.train.AdamOptimizer(learning_rate=self.config["lr"]) + @override(TFPolicyGraph) def gradients(self, optimizer): if self.config["grad_norm_clipping"] is not None: actor_grads_and_vars = _minimize_and_clip( - self.actor_optimizer, + optimizer, self.loss.actor_loss, var_list=self.p_func_vars, clip_val=self.config["grad_norm_clipping"]) critic_grads_and_vars = _minimize_and_clip( - self.critic_optimizer, + optimizer, self.loss.critic_loss, - var_list=self.q_func_vars, + var_list=self.q_func_vars + self.twin_q_func_vars + if self.config["twin_q"] else self.q_func_vars, clip_val=self.config["grad_norm_clipping"]) else: - actor_grads_and_vars = self.actor_optimizer.compute_gradients( + actor_grads_and_vars = optimizer.compute_gradients( self.loss.actor_loss, var_list=self.p_func_vars) - critic_grads_and_vars = self.critic_optimizer.compute_gradients( - self.loss.critic_loss, var_list=self.q_func_vars) + critic_grads_and_vars = optimizer.compute_gradients( + self.loss.critic_loss, + var_list=self.q_func_vars + self.twin_q_func_vars + if self.config["twin_q"] else self.q_func_vars) actor_grads_and_vars = [(g, v) for (g, v) in actor_grads_and_vars if g is not None] critic_grads_and_vars = [(g, v) for (g, v) in critic_grads_and_vars @@ -314,20 +400,85 @@ def gradients(self, optimizer): grads_and_vars = actor_grads_and_vars + critic_grads_and_vars return grads_and_vars + @override(TFPolicyGraph) def extra_compute_action_feed_dict(self): return { self.stochastic: True, self.eps: self.cur_epsilon, } + @override(TFPolicyGraph) def extra_compute_grad_fetches(self): return { "td_error": self.loss.td_error, } - def postprocess_trajectory(self, sample_batch, other_agent_batches=None): + @override(PolicyGraph) + def postprocess_trajectory(self, + sample_batch, + other_agent_batches=None, + episode=None): return _postprocess_dqn(self, sample_batch) + @override(TFPolicyGraph) + def get_weights(self): + return self.variables.get_weights() + + @override(TFPolicyGraph) + def set_weights(self, weights): + self.variables.set_weights(weights) + + @override(PolicyGraph) + def get_state(self): + return [TFPolicyGraph.get_state(self), self.cur_epsilon] + + @override(PolicyGraph) + def set_state(self, state): + TFPolicyGraph.set_state(self, state[0]) + self.set_epsilon(state[1]) + + def _build_q_network(self, obs, obs_space, actions): + q_net = QNetwork( + ModelCatalog.get_model({ + "obs": obs, + "is_training": self._get_is_training_placeholder(), + }, obs_space, 1, self.config["model"]), actions, + self.config["critic_hiddens"], + self.config["critic_hidden_activation"]) + return q_net.value, q_net.model + + def _build_p_network(self, obs, obs_space): + return PNetwork( + ModelCatalog.get_model({ + "obs": obs, + "is_training": self._get_is_training_placeholder(), + }, obs_space, 1, self.config["model"]), self.dim_actions, + self.config["actor_hiddens"], + self.config["actor_hidden_activation"]).action_scores + + def 
_build_action_network(self, p_values, stochastic, eps, + is_target=False): + return ActionNetwork( + p_values, self.low_action, self.high_action, stochastic, eps, + self.config["exploration_theta"], self.config["exploration_sigma"], + self.config["smooth_target_policy"], self.config["act_noise"], + is_target, self.config["target_noise"], + self.config["noise_clip"]).actions + + def _build_actor_critic_loss(self, + q_t, + q_tp1, + q_tp0, + twin_q_t=None, + twin_q_tp1=None): + return ActorCriticLoss( + q_t, q_tp1, q_tp0, self.importance_weights, self.rew_t, + self.done_mask, twin_q_t, twin_q_tp1, + self.config["actor_loss_coeff"], self.config["critic_loss_coeff"], + self.config["gamma"], self.config["n_step"], + self.config["use_huber"], self.config["huber_threshold"], + self.config["twin_q"]) + def compute_td_error(self, obs_t, act_t, rew_t, obs_tp1, done_mask, importance_weights): td_err = self.sess.run( @@ -353,16 +504,3 @@ def update_target(self, tau=None): def set_epsilon(self, epsilon): self.cur_epsilon = epsilon - - def get_weights(self): - return self.variables.get_weights() - - def set_weights(self, weights): - self.variables.set_weights(weights) - - def get_state(self): - return [TFPolicyGraph.get_state(self), self.cur_epsilon] - - def set_state(self, state): - TFPolicyGraph.set_state(self, state[0]) - self.set_epsilon(state[1]) diff --git a/python/ray/rllib/agents/dqn/apex.py b/python/ray/rllib/agents/dqn/apex.py index e6058b41f9af3..c9b15e0eca792 100644 --- a/python/ray/rllib/agents/dqn/apex.py +++ b/python/ray/rllib/agents/dqn/apex.py @@ -4,10 +4,12 @@ from ray.rllib.agents.dqn.dqn import DQNAgent, DEFAULT_CONFIG as DQN_CONFIG from ray.rllib.utils import merge_dicts -from ray.tune.trial import Resources +from ray.rllib.utils.annotations import override +# yapf: disable +# __sphinx_doc_begin__ APEX_DEFAULT_CONFIG = merge_dicts( - DQN_CONFIG, + DQN_CONFIG, # see also the options in dqn.py, which are also supported { "optimizer_class": "AsyncReplayOptimizer", "optimizer": merge_dicts( @@ -17,7 +19,7 @@ "debug": False }), "n_step": 3, - "gpu": True, + "num_gpus": 1, "num_workers": 32, "buffer_size": 2000000, "learning_starts": 50000, @@ -30,6 +32,8 @@ "min_iter_time_s": 30, }, ) +# __sphinx_doc_end__ +# yapf: enable class ApexAgent(DQNAgent): @@ -42,15 +46,7 @@ class ApexAgent(DQNAgent): _agent_name = "APEX" _default_config = APEX_DEFAULT_CONFIG - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - return Resources( - cpu=1 + cf["optimizer"]["num_replay_buffer_shards"], - gpu=cf["gpu"] and cf["gpu_fraction"] or 0, - extra_cpu=cf["num_cpus_per_worker"] * cf["num_workers"], - extra_gpu=cf["num_gpus_per_worker"] * cf["num_workers"]) - + @override(DQNAgent) def update_target_if_needed(self): # Ape-X updates based on num steps trained, not sampled if self.optimizer.num_steps_trained - self.last_target_update_ts > \ diff --git a/python/ray/rllib/agents/dqn/common/wrappers.py b/python/ray/rllib/agents/dqn/common/wrappers.py deleted file mode 100644 index eb6a6c0d5b5c2..0000000000000 --- a/python/ray/rllib/agents/dqn/common/wrappers.py +++ /dev/null @@ -1,19 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -from ray.rllib.models import ModelCatalog -from ray.rllib.env.atari_wrappers import wrap_deepmind - - -def wrap_dqn(env, options): - """Apply a common set of wrappers for DQN.""" - - is_atari = hasattr(env.unwrapped, "ale") - - # Override atari default to use 
the deepmind wrappers. - # TODO(ekl) this logic should be pushed to the catalog. - if is_atari and "custom_preprocessor" not in options: - return wrap_deepmind(env, dim=options.get("dim", 84)) - - return ModelCatalog.get_preprocessor_as_wrapper(env, options) diff --git a/python/ray/rllib/agents/dqn/dqn.py b/python/ray/rllib/agents/dqn/dqn.py index c945cdbc9fe8e..10e3edd48bd82 100644 --- a/python/ray/rllib/agents/dqn/dqn.py +++ b/python/ray/rllib/agents/dqn/dqn.py @@ -7,10 +7,8 @@ from ray.rllib import optimizers from ray.rllib.agents.agent import Agent, with_common_config from ray.rllib.agents.dqn.dqn_policy_graph import DQNPolicyGraph -from ray.rllib.evaluation.metrics import collect_metrics -from ray.rllib.utils import merge_dicts +from ray.rllib.utils.annotations import override from ray.rllib.utils.schedules import ConstantSchedule, LinearSchedule -from ray.tune.trial import Resources OPTIMIZER_SHARED_CONFIGS = [ "buffer_size", "prioritized_replay", "prioritized_replay_alpha", @@ -20,6 +18,8 @@ "learning_starts" ] +# yapf: disable +# __sphinx_doc_begin__ DEFAULT_CONFIG = with_common_config({ # === Model === # Number of atoms for representing the distribution of return. When @@ -40,8 +40,6 @@ "hiddens": [256], # N-step Q learning "n_step": 1, - # Whether to use rllib or deepmind preprocessors - "preprocessor_pref": "deepmind", # === Exploration === # Max num timesteps for annealing schedules. Exploration is annealed from @@ -96,16 +94,10 @@ "train_batch_size": 32, # === Parallelism === - # Whether to use a GPU for local optimization. - "gpu": False, # Number of workers for collecting samples with. This only makes sense # to increase if your environment is particularly slow to sample, or if # you"re using the Async or Ape-X optimizers. "num_workers": 0, - # Whether to allocate GPUs for workers (if > 0). - "num_gpus_per_worker": 0, - # Whether to allocate CPUs for workers (if > 0). - "num_cpus_per_worker": 1, # Optimizer class to use. "optimizer_class": "SyncReplayOptimizer", # Whether to use a distribution of epsilons across workers for exploration. 
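# Note: illustration only, not part of the patch. When "n_step" above is
# greater than 1, sampled transitions are rewritten so that reward[i] folds
# in the next n-1 discounted rewards and new_obs[i] points n steps ahead.
# A rough sketch of that rewrite (ignoring episode boundaries):
def nstep_fold(n_step, gamma, rewards, new_obs):
    rewards, new_obs = list(rewards), list(new_obs)
    for i in range(len(rewards) - n_step + 1):
        for j in range(1, n_step):
            rewards[i] += gamma**j * rewards[i + j]
        new_obs[i] = new_obs[i + n_step - 1]
    return rewards, new_obs

# nstep_fold(3, 0.9, [1, 1, 1, 1, 1], ["o1", "o2", "o3", "o4", "o5"])
# folds the first reward to 1 + 0.9 + 0.81 = 2.71 and moves its new_obs
# to "o3".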
@@ -115,6 +107,8 @@ # Prevent iterations from going lower than this time span "min_iter_time_s": 1, }) +# __sphinx_doc_end__ +# yapf: enable class DQNAgent(Agent): @@ -124,22 +118,14 @@ class DQNAgent(Agent): _default_config = DEFAULT_CONFIG _policy_graph = DQNPolicyGraph - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - return Resources( - cpu=1, - gpu=cf["gpu"] and cf["gpu_fraction"] or 0, - extra_cpu=cf["num_cpus_per_worker"] * cf["num_workers"], - extra_gpu=cf["num_gpus_per_worker"] * cf["num_workers"]) - + @override(Agent) def _init(self): # Update effective batch size to include n-step - adjusted_batch_size = ( - self.config["sample_batch_size"] + self.config["n_step"] - 1) + adjusted_batch_size = max(self.config["sample_batch_size"], + self.config["n_step"]) self.config["sample_batch_size"] = adjusted_batch_size - self.exploration0 = self._make_exploration_schedule(0) + self.exploration0 = self._make_exploration_schedule(-1) self.explorations = [ self._make_exploration_schedule(i) for i in range(self.config["num_workers"]) @@ -159,12 +145,9 @@ def _init(self): self.env_creator, self._policy_graph) def create_remote_evaluators(): - return self.make_remote_evaluators( - self.env_creator, self._policy_graph, - self.config["num_workers"], { - "num_cpus": self.config["num_cpus_per_worker"], - "num_gpus": self.config["num_gpus_per_worker"] - }) + return self.make_remote_evaluators(self.env_creator, + self._policy_graph, + self.config["num_workers"]) if self.config["optimizer_class"] != "AsyncReplayOptimizer": self.remote_evaluators = create_remote_evaluators() @@ -178,47 +161,16 @@ def create_remote_evaluators(): # Create the remote evaluators *after* the replay actors if self.remote_evaluators is None: self.remote_evaluators = create_remote_evaluators() - self.optimizer.set_evaluators(self.remote_evaluators) + self.optimizer._set_evaluators(self.remote_evaluators) self.last_target_update_ts = 0 self.num_target_updates = 0 - def _make_exploration_schedule(self, worker_index): - # Use either a different `eps` per worker, or a linear schedule. 
- if self.config["per_worker_exploration"]: - assert self.config["num_workers"] > 1, \ - "This requires multiple workers" - exponent = ( - 1 + worker_index / float(self.config["num_workers"] - 1) * 7) - return ConstantSchedule(0.4**exponent) - return LinearSchedule( - schedule_timesteps=int(self.config["exploration_fraction"] * - self.config["schedule_max_timesteps"]), - initial_p=1.0, - final_p=self.config["exploration_final_eps"]) - - @property - def global_timestep(self): - return self.optimizer.num_steps_sampled - - def update_target_if_needed(self): - if self.global_timestep - self.last_target_update_ts > \ - self.config["target_network_update_freq"]: - self.local_evaluator.foreach_trainable_policy( - lambda p, _: p.update_target()) - self.last_target_update_ts = self.global_timestep - self.num_target_updates += 1 - + @override(Agent) def _train(self): start_timestep = self.global_timestep - start = time.time() - while (self.global_timestep - start_timestep < - self.config["timesteps_per_iteration"] - ) or time.time() - start < self.config["min_iter_time_s"]: - self.optimizer.step() - self.update_target_if_needed() - + # Update worker explorations exp_vals = [self.exploration0.value(self.global_timestep)] self.local_evaluator.foreach_trainable_policy( lambda p, _: p.set_epsilon(exp_vals[0])) @@ -228,14 +180,23 @@ def _train(self): lambda p, _: p.set_epsilon(exp_val)) exp_vals.append(exp_val) + # Do optimization steps + start = time.time() + while (self.global_timestep - start_timestep < + self.config["timesteps_per_iteration"] + ) or time.time() - start < self.config["min_iter_time_s"]: + self.optimizer.step() + self.update_target_if_needed() + if self.config["per_worker_exploration"]: # Only collect metrics from the third of workers with lowest eps - result = collect_metrics( - self.local_evaluator, - self.remote_evaluators[-len(self.remote_evaluators) // 3:]) + result = self.optimizer.collect_metrics( + timeout_seconds=self.config["collect_metrics_timeout"], + selected_evaluators=self.remote_evaluators[ + -len(self.remote_evaluators) // 3:]) else: - result = collect_metrics(self.local_evaluator, - self.remote_evaluators) + result = self.optimizer.collect_metrics( + timeout_seconds=self.config["collect_metrics_timeout"]) result.update( timesteps_this_iter=self.global_timestep - start_timestep, @@ -246,6 +207,38 @@ def _train(self): }, **self.optimizer.stats())) return result + def update_target_if_needed(self): + if self.global_timestep - self.last_target_update_ts > \ + self.config["target_network_update_freq"]: + self.local_evaluator.foreach_trainable_policy( + lambda p, _: p.update_target()) + self.last_target_update_ts = self.global_timestep + self.num_target_updates += 1 + + @property + def global_timestep(self): + return self.optimizer.num_steps_sampled + + def _make_exploration_schedule(self, worker_index): + # Use either a different `eps` per worker, or a linear schedule. 
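+        # With the per-worker schedule, worker i of N gets a constant eps
+        # of 0.4 ** (1 + 7 * i / (N - 1)); for N = 8 that ranges from 0.4
+        # (worker 0) down to roughly 0.00066 (worker 7). The local
+        # evaluator (worker_index -1) gets eps 0.0 below.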
+ if self.config["per_worker_exploration"]: + assert self.config["num_workers"] > 1, \ + "This requires multiple workers" + if worker_index >= 0: + exponent = ( + 1 + + worker_index / float(self.config["num_workers"] - 1) * 7) + return ConstantSchedule(0.4**exponent) + else: + # local ev should have zero exploration so that eval rollouts + # run properly + return ConstantSchedule(0.0) + return LinearSchedule( + schedule_timesteps=int(self.config["exploration_fraction"] * + self.config["schedule_max_timesteps"]), + initial_p=1.0, + final_p=self.config["exploration_final_eps"]) + def __getstate__(self): state = Agent.__getstate__(self) state.update({ diff --git a/python/ray/rllib/agents/dqn/dqn_policy_graph.py b/python/ray/rllib/agents/dqn/dqn_policy_graph.py index a2e8c8022c7b1..625e577fff164 100644 --- a/python/ray/rllib/agents/dqn/dqn_policy_graph.py +++ b/python/ray/rllib/agents/dqn/dqn_policy_graph.py @@ -10,7 +10,9 @@ import ray from ray.rllib.models import ModelCatalog from ray.rllib.evaluation.sample_batch import SampleBatch +from ray.rllib.utils.annotations import override from ray.rllib.utils.error import UnsupportedSpaceException +from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph Q_SCOPE = "q_func" @@ -28,17 +30,23 @@ def __init__(self, v_min=-10.0, v_max=10.0, sigma0=0.5): + self.model = model with tf.variable_scope("action_value"): - action_out = model.last_layer - for i in range(len(hiddens)): - if use_noisy: - action_out = self.noisy_layer("hidden_%d" % i, action_out, - hiddens[i], sigma0) - else: - action_out = layers.fully_connected( - action_out, - num_outputs=hiddens[i], - activation_fn=tf.nn.relu) + if hiddens: + action_out = model.last_layer + for i in range(len(hiddens)): + if use_noisy: + action_out = self.noisy_layer( + "hidden_%d" % i, action_out, hiddens[i], sigma0) + else: + action_out = layers.fully_connected( + action_out, + num_outputs=hiddens[i], + activation_fn=tf.nn.relu) + else: + # Avoid postprocessing the outputs. This enables custom models + # to be used for parametric action DQN. + action_out = model.outputs if use_noisy: action_scores = self.noisy_layer( "output", @@ -46,11 +54,13 @@ def __init__(self, num_actions * num_atoms, sigma0, non_linear=False) - else: + elif hiddens: action_scores = layers.fully_connected( action_out, num_outputs=num_actions * num_atoms, activation_fn=None) + else: + action_scores = model.outputs if num_atoms > 1: # Distributional Q-learning uses a discrete support z # to represent the action value distribution @@ -106,7 +116,7 @@ def __init__(self, self.logits = support_logits_per_action self.dist = support_prob_per_action else: - action_scores_mean = tf.reduce_mean(action_scores, 1) + action_scores_mean = _reduce_mean_ignore_inf(action_scores, 1) action_scores_centered = action_scores - tf.expand_dims( action_scores_mean, 1) self.value = state_score + action_scores_centered @@ -175,11 +185,15 @@ class QValuePolicy(object): def __init__(self, q_values, observations, num_actions, stochastic, eps): deterministic_actions = tf.argmax(q_values, axis=1) batch_size = tf.shape(observations)[0] - random_actions = tf.random_uniform( - tf.stack([batch_size]), - minval=0, - maxval=num_actions, - dtype=tf.int64) + + # Special case masked out actions (q_value ~= -inf) so that we don't + # even consider them for exploration. 
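+        # (Invalid actions keep a logit of tf.float32.min while valid ones
+        # share a logit of 1, so tf.multinomial samples uniformly over the
+        # valid actions and effectively never picks a masked one.)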
+ random_valid_action_logits = tf.where( + tf.equal(q_values, tf.float32.min), + tf.ones_like(q_values) * tf.float32.min, tf.ones_like(q_values)) + random_actions = tf.squeeze( + tf.multinomial(random_valid_action_logits, 1), axis=1) + chose_random = tf.random_uniform( tf.stack([batch_size]), minval=0, maxval=1, dtype=tf.float32) < eps stochastic_actions = tf.where(chose_random, random_actions, @@ -241,6 +255,10 @@ def __init__(self, self.td_error = tf.nn.softmax_cross_entropy_with_logits( labels=m, logits=q_logits_t_selected) self.loss = tf.reduce_mean(self.td_error * importance_weights) + self.stats = { + # TODO: better Q stats for dist dqn + "mean_td_error": tf.reduce_mean(self.td_error), + } else: q_tp1_best_masked = (1.0 - done_mask) * q_tp1_best @@ -252,6 +270,12 @@ def __init__(self, q_t_selected - tf.stop_gradient(q_t_selected_target)) self.loss = tf.reduce_mean( importance_weights * _huber_loss(self.td_error)) + self.stats = { + "mean_q": tf.reduce_mean(q_t_selected), + "min_q": tf.reduce_min(q_t_selected), + "max_q": tf.reduce_max(q_t_selected), + "mean_td_error": tf.reduce_mean(self.td_error), + } class DQNPolicyGraph(TFPolicyGraph): @@ -274,8 +298,8 @@ def __init__(self, observation_space, action_space, config): # Action Q network with tf.variable_scope(Q_SCOPE) as scope: - q_values, q_logits, q_dist = self._build_q_network( - self.cur_observations) + q_values, q_logits, q_dist, _ = self._build_q_network( + self.cur_observations, observation_space) self.q_func_vars = _scope_vars(scope.name) # Action outputs @@ -294,12 +318,17 @@ def __init__(self, observation_space, action_space, config): # q network evaluation with tf.variable_scope(Q_SCOPE, reuse=True): - q_t, q_logits_t, q_dist_t = self._build_q_network(self.obs_t) + prev_update_ops = set(tf.get_collection(tf.GraphKeys.UPDATE_OPS)) + q_t, q_logits_t, q_dist_t, model = self._build_q_network( + self.obs_t, observation_space) + q_batchnorm_update_ops = list( + set(tf.get_collection(tf.GraphKeys.UPDATE_OPS)) - + prev_update_ops) # target q network evalution with tf.variable_scope(Q_TARGET_SCOPE) as scope: - q_tp1, q_logits_tp1, q_dist_tp1 = self._build_q_network( - self.obs_tp1) + q_tp1, q_logits_tp1, q_dist_tp1, _ = self._build_q_network( + self.obs_tp1, observation_space) self.target_q_func_vars = _scope_vars(scope.name) # q scores for actions which we know were selected in the given state. 
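# Note: illustration only, not part of the patch. "q scores for actions we
# know were selected" are typically gathered with a one-hot mask over the
# action dimension, e.g. (numpy sketch):
import numpy as np

q_t = np.array([[1.0, 5.0, 3.0],
                [2.0, 0.5, 4.0]])           # [batch, num_actions]
act_t = np.array([1, 2])                    # actions taken in the batch
one_hot = np.eye(q_t.shape[1])[act_t]
q_t_selected = (q_t * one_hot).sum(axis=1)  # -> [5.0, 4.0]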
@@ -312,8 +341,8 @@ def __init__(self, observation_space, action_space, config): if config["double_q"]: with tf.variable_scope(Q_SCOPE, reuse=True): q_tp1_using_online_net, q_logits_tp1_using_online_net, \ - q_dist_tp1_using_online_net = self._build_q_network( - self.obs_tp1) + q_dist_tp1_using_online_net, _ = self._build_q_network( + self.obs_tp1, observation_space) q_tp1_best_using_online_net = tf.argmax(q_tp1_using_online_net, 1) q_tp1_best_one_hot_selection = tf.one_hot( q_tp1_best_using_online_net, self.num_actions) @@ -358,35 +387,18 @@ def __init__(self, observation_space, action_space, config): self.sess, obs_input=self.cur_observations, action_sampler=self.output_actions, - loss=self.loss.loss, - loss_inputs=self.loss_inputs) + loss=model.loss() + self.loss.loss, + loss_inputs=self.loss_inputs, + update_ops=q_batchnorm_update_ops) self.sess.run(tf.global_variables_initializer()) - def _build_q_network(self, obs): - qnet = QNetwork( - ModelCatalog.get_model(obs, 1, self.config["model"]), - self.num_actions, self.config["dueling"], self.config["hiddens"], - self.config["noisy"], self.config["num_atoms"], - self.config["v_min"], self.config["v_max"], self.config["sigma0"]) - return qnet.value, qnet.logits, qnet.dist - - def _build_q_value_policy(self, q_values): - return QValuePolicy(q_values, self.cur_observations, self.num_actions, - self.stochastic, self.eps).action - - def _build_q_loss(self, q_t_selected, q_logits_t_selected, q_tp1_best, - q_dist_tp1_best): - return QLoss(q_t_selected, q_logits_t_selected, q_tp1_best, - q_dist_tp1_best, self.importance_weights, self.rew_t, - self.done_mask, self.config["gamma"], - self.config["n_step"], self.config["num_atoms"], - self.config["v_min"], self.config["v_max"]) - + @override(TFPolicyGraph) def optimizer(self): return tf.train.AdamOptimizer( learning_rate=self.config["lr"], epsilon=self.config["adam_epsilon"]) + @override(TFPolicyGraph) def gradients(self, optimizer): if self.config["grad_norm_clipping"] is not None: grads_and_vars = _minimize_and_clip( @@ -400,20 +412,36 @@ def gradients(self, optimizer): grads_and_vars = [(g, v) for (g, v) in grads_and_vars if g is not None] return grads_and_vars + @override(TFPolicyGraph) def extra_compute_action_feed_dict(self): return { self.stochastic: True, self.eps: self.cur_epsilon, } + @override(TFPolicyGraph) def extra_compute_grad_fetches(self): return { "td_error": self.loss.td_error, + "stats": self.loss.stats, } - def postprocess_trajectory(self, sample_batch, other_agent_batches=None): + @override(PolicyGraph) + def postprocess_trajectory(self, + sample_batch, + other_agent_batches=None, + episode=None): return _postprocess_dqn(self, sample_batch) + @override(PolicyGraph) + def get_state(self): + return [TFPolicyGraph.get_state(self), self.cur_epsilon] + + @override(PolicyGraph) + def set_state(self, state): + TFPolicyGraph.set_state(self, state[0]) + self.set_epsilon(state[1]) + def compute_td_error(self, obs_t, act_t, rew_t, obs_tp1, done_mask, importance_weights): td_err = self.sess.run( @@ -434,15 +462,31 @@ def update_target(self): def set_epsilon(self, epsilon): self.cur_epsilon = epsilon - def get_state(self): - return [TFPolicyGraph.get_state(self), self.cur_epsilon] + def _build_q_network(self, obs, space): + qnet = QNetwork( + ModelCatalog.get_model({ + "obs": obs, + "is_training": self._get_is_training_placeholder(), + }, space, self.num_actions, self.config["model"]), + self.num_actions, self.config["dueling"], self.config["hiddens"], + self.config["noisy"], 
self.config["num_atoms"], + self.config["v_min"], self.config["v_max"], self.config["sigma0"]) + return qnet.value, qnet.logits, qnet.dist, qnet.model - def set_state(self, state): - TFPolicyGraph.set_state(self, state[0]) - self.set_epsilon(state[1]) + def _build_q_value_policy(self, q_values): + return QValuePolicy(q_values, self.cur_observations, self.num_actions, + self.stochastic, self.eps).action + + def _build_q_loss(self, q_t_selected, q_logits_t_selected, q_tp1_best, + q_dist_tp1_best): + return QLoss(q_t_selected, q_logits_t_selected, q_tp1_best, + q_dist_tp1_best, self.importance_weights, self.rew_t, + self.done_mask, self.config["gamma"], + self.config["n_step"], self.config["num_atoms"], + self.config["v_min"], self.config["v_max"]) -def adjust_nstep(n_step, gamma, obs, actions, rewards, new_obs, dones): +def _adjust_nstep(n_step, gamma, obs, actions, rewards, new_obs, dones): """Rewrites the given trajectory fragments to encode n-step rewards. reward[i] = ( @@ -475,9 +519,9 @@ def _postprocess_dqn(policy_graph, sample_batch): # N-step Q adjustments if policy_graph.config["n_step"] > 1: - adjust_nstep(policy_graph.config["n_step"], - policy_graph.config["gamma"], obs, actions, rewards, - new_obs, dones) + _adjust_nstep(policy_graph.config["n_step"], + policy_graph.config["gamma"], obs, actions, rewards, + new_obs, dones) batch = SampleBatch({ "obs": obs, @@ -500,6 +544,14 @@ def _postprocess_dqn(policy_graph, sample_batch): return batch +def _reduce_mean_ignore_inf(x, axis): + """Same as tf.reduce_mean() but ignores -inf values.""" + mask = tf.not_equal(x, tf.float32.min) + x_zeroed = tf.where(mask, x, tf.zeros_like(x)) + return (tf.reduce_sum(x_zeroed, axis) / tf.reduce_sum( + tf.cast(mask, tf.float32), axis)) + + def _huber_loss(x, delta=1.0): """Reference: https://en.wikipedia.org/wiki/Huber_loss""" return tf.where( diff --git a/python/ray/rllib/agents/es/es.py b/python/ray/rllib/agents/es/es.py index 1ce219b7c0ab1..4aa4a86aac889 100644 --- a/python/ray/rllib/agents/es/es.py +++ b/python/ray/rllib/agents/es/es.py @@ -6,25 +6,29 @@ from __future__ import print_function from collections import namedtuple +import logging import numpy as np import time import ray -from ray.rllib.agents import Agent -from ray.tune.trial import Resources +from ray.rllib.agents import Agent, with_common_config from ray.rllib.agents.es import optimizers from ray.rllib.agents.es import policies -from ray.rllib.agents.es import tabular_logger as tlogger from ray.rllib.agents.es import utils -from ray.rllib.utils import merge_dicts +from ray.rllib.utils.annotations import override +from ray.rllib.utils import FilterManager + +logger = logging.getLogger(__name__) Result = namedtuple("Result", [ "noise_indices", "noisy_returns", "sign_noisy_returns", "noisy_lengths", "eval_returns", "eval_lengths" ]) -DEFAULT_CONFIG = { +# yapf: disable +# __sphinx_doc_begin__ +DEFAULT_CONFIG = with_common_config({ "l2_coeff": 0.005, "noise_stdev": 0.02, "episodes_per_batch": 1000, @@ -36,9 +40,9 @@ "observation_filter": "MeanStdFilter", "noise_size": 250000000, "report_length": 10, - "env": None, - "env_config": {}, -} +}) +# __sphinx_doc_end__ +# yapf: enable @ray.remote @@ -76,12 +80,30 @@ def __init__(self, self.env = env_creator(config["env_config"]) from ray.rllib import models - self.preprocessor = models.ModelCatalog.get_preprocessor(self.env) + self.preprocessor = models.ModelCatalog.get_preprocessor( + self.env, config["model"]) self.sess = utils.make_session(single_threaded=True) self.policy = 
policies.GenericPolicy( - self.sess, self.env.action_space, self.preprocessor, - config["observation_filter"], **policy_params) + self.sess, self.env.action_space, self.env.observation_space, + self.preprocessor, config["observation_filter"], config["model"], + **policy_params) + + @property + def filters(self): + return {"default": self.policy.get_filter()} + + def sync_filters(self, new_filters): + for k in self.filters: + self.filters[k].sync(new_filters[k]) + + def get_filters(self, flush_after=False): + return_filters = {} + for k, f in self.filters.items(): + return_filters[k] = f.as_serializable() + if flush_after: + f.clear_buffer() + return return_filters def rollout(self, timestep_limit, add_noise=True): rollout_rewards, rollout_length = policies.rollout( @@ -146,11 +168,7 @@ class ESAgent(Agent): _agent_name = "ES" _default_config = DEFAULT_CONFIG - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - return Resources(cpu=1, gpu=0, extra_cpu=cf["num_workers"]) - + @override(Agent) def _init(self): policy_params = {"action_noise_std": 0.01} @@ -160,18 +178,19 @@ def _init(self): self.sess = utils.make_session(single_threaded=False) self.policy = policies.GenericPolicy( - self.sess, env.action_space, preprocessor, - self.config["observation_filter"], **policy_params) + self.sess, env.action_space, env.observation_space, preprocessor, + self.config["observation_filter"], self.config["model"], + **policy_params) self.optimizer = optimizers.Adam(self.policy, self.config["stepsize"]) self.report_length = self.config["report_length"] # Create the shared noise table. - print("Creating shared noise table.") + logger.info("Creating shared noise table.") noise_id = create_shared_noise.remote(self.config["noise_size"]) self.noise = SharedNoiseTable(ray.get(noise_id)) # Create the actors. - print("Creating actors.") + logger.info("Creating actors.") self.workers = [ Worker.remote(self.config, policy_params, self.env_creator, noise_id) for _ in range(self.config["num_workers"]) @@ -181,26 +200,7 @@ def _init(self): self.reward_list = [] self.tstart = time.time() - def _collect_results(self, theta_id, min_episodes, min_timesteps): - num_episodes, num_timesteps = 0, 0 - results = [] - while num_episodes < min_episodes or num_timesteps < min_timesteps: - print("Collected {} episodes {} timesteps so far this iter".format( - num_episodes, num_timesteps)) - rollout_ids = [ - worker.do_rollouts.remote(theta_id) for worker in self.workers - ] - # Get the results of the rollouts. - for result in ray.get(rollout_ids): - results.append(result) - # Update the number of episodes and the number of timesteps - # keeping in mind that result.noisy_lengths is a list of lists, - # where the inner lists have length 2. 
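The Worker class above now owns its observation filter and exposes it through the filters property, sync_filters(), and get_filters(flush_after=True): the driver periodically pulls the buffered statistics from each worker, folds them into a central filter, and broadcasts the merged filter back (the FilterManager.synchronize call added to _train further down). A self-contained sketch of that round trip, using a toy running-mean filter rather than Ray's MeanStdFilter/FilterManager; ToyFilter and the driver/worker objects here are illustrative only:

import numpy as np


class ToyFilter(object):
    """Running-mean filter; buf_* holds statistics gathered since the last flush."""

    def __init__(self):
        self.count, self.total = 0, 0.0          # merged statistics
        self.buf_count, self.buf_total = 0, 0.0  # un-flushed local deltas

    def observe(self, x):
        self.count += 1
        self.total += x
        self.buf_count += 1
        self.buf_total += x

    def as_serializable(self):
        return {"count": self.buf_count, "total": self.buf_total}

    def clear_buffer(self):
        self.buf_count, self.buf_total = 0, 0.0

    def apply_delta(self, delta):
        self.count += delta["count"]
        self.total += delta["total"]

    def sync(self, other):
        self.count, self.total = other.count, other.total


central, workers = ToyFilter(), [ToyFilter() for _ in range(2)]
for w in workers:                                # each worker filters its own rollouts
    for x in np.random.randn(5):
        w.observe(x)
deltas = [w.as_serializable() for w in workers]  # ~ get_filters(flush_after=True)
for w in workers:
    w.clear_buffer()
for delta in deltas:
    central.apply_delta(delta)                   # merge into the driver's filter
for w in workers:
    w.sync(central)                              # ~ sync_filters(new_filters)
print(central.count, round(central.total, 3))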
- num_episodes += sum(len(pair) for pair in result.noisy_lengths) - num_timesteps += sum( - sum(pair) for pair in result.noisy_lengths) - return results, num_episodes, num_timesteps - + @override(Agent) def _train(self): config = self.config @@ -266,20 +266,10 @@ def _train(self): if len(all_eval_returns) > 0: self.reward_list.append(np.mean(eval_returns)) - tlogger.record_tabular("EvalEpRewStd", eval_returns.std()) - tlogger.record_tabular("EvalEpLenMean", eval_lengths.mean()) - - tlogger.record_tabular("EpRewMean", noisy_returns.mean()) - tlogger.record_tabular("EpRewStd", noisy_returns.std()) - tlogger.record_tabular("EpLenMean", noisy_lengths.mean()) - - tlogger.record_tabular("Norm", float(np.square(theta).sum())) - tlogger.record_tabular("GradNorm", float(np.square(g).sum())) - tlogger.record_tabular("UpdateRatio", float(update_ratio)) - - tlogger.record_tabular("EpisodesThisIter", noisy_lengths.size) - tlogger.record_tabular("EpisodesSoFar", self.episodes_so_far) - tlogger.dump_tabular() + # Now sync the filters + FilterManager.synchronize({ + "default": self.policy.get_filter() + }, self.workers) info = { "weights_norm": np.square(theta).sum(), @@ -298,20 +288,49 @@ def _train(self): return result + @override(Agent) + def compute_action(self, observation): + return self.policy.compute(observation, update=False)[0] + + @override(Agent) def _stop(self): # workaround for https://github.com/ray-project/ray/issues/1516 for w in self.workers: w.__ray_terminate__.remote() + def _collect_results(self, theta_id, min_episodes, min_timesteps): + num_episodes, num_timesteps = 0, 0 + results = [] + while num_episodes < min_episodes or num_timesteps < min_timesteps: + logger.info( + "Collected {} episodes {} timesteps so far this iter".format( + num_episodes, num_timesteps)) + rollout_ids = [ + worker.do_rollouts.remote(theta_id) for worker in self.workers + ] + # Get the results of the rollouts. + for result in ray.get(rollout_ids): + results.append(result) + # Update the number of episodes and the number of timesteps + # keeping in mind that result.noisy_lengths is a list of lists, + # where the inner lists have length 2. 
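Each entry of result.noisy_lengths is a length-2 list, one rollout length per perturbation sign of a sampled noise index, which is why the episode count adds len(pair) and the timestep count adds sum(pair). A tiny worked example with made-up lengths:

# Hypothetical lengths: [len with +noise, len with -noise] per sampled noise index.
noisy_lengths = [[120, 95], [88, 102]]

num_episodes = sum(len(pair) for pair in noisy_lengths)   # 2 + 2 = 4 episodes
num_timesteps = sum(sum(pair) for pair in noisy_lengths)  # 215 + 190 = 405 steps
print(num_episodes, num_timesteps)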
+ num_episodes += sum(len(pair) for pair in result.noisy_lengths) + num_timesteps += sum( + sum(pair) for pair in result.noisy_lengths) + + return results, num_episodes, num_timesteps + def __getstate__(self): return { "weights": self.policy.get_weights(), + "filter": self.policy.get_filter(), "episodes_so_far": self.episodes_so_far, } def __setstate__(self, state): - self.policy.set_weights(state["weights"]) self.episodes_so_far = state["episodes_so_far"] - - def compute_action(self, observation): - return self.policy.compute(observation, update=False)[0] + self.policy.set_weights(state["weights"]) + self.policy.set_filter(state["filter"]) + FilterManager.synchronize({ + "default": self.policy.get_filter() + }, self.workers) diff --git a/python/ray/rllib/agents/es/policies.py b/python/ray/rllib/agents/es/policies.py index d62fee43c4c57..cf2da630e0866 100644 --- a/python/ray/rllib/agents/es/policies.py +++ b/python/ray/rllib/agents/es/policies.py @@ -10,6 +10,7 @@ import tensorflow as tf import ray +from ray.rllib.evaluation.sampler import _unbatch_tuple_actions from ray.rllib.models import ModelCatalog from ray.rllib.utils.filter import get_filter @@ -38,8 +39,8 @@ def rollout(policy, env, timestep_limit=None, add_noise=False): class GenericPolicy(object): - def __init__(self, sess, action_space, preprocessor, observation_filter, - action_noise_std): + def __init__(self, sess, action_space, obs_space, preprocessor, + observation_filter, model_options, action_noise_std): self.sess = sess self.action_space = action_space self.action_noise_std = action_noise_std @@ -51,8 +52,10 @@ def __init__(self, sess, action_space, preprocessor, observation_filter, # Policy network. dist_class, dist_dim = ModelCatalog.get_action_dist( - self.action_space, dist_type="deterministic") - model = ModelCatalog.get_model(self.inputs, dist_dim) + self.action_space, model_options, dist_type="deterministic") + model = ModelCatalog.get_model({ + "obs": self.inputs + }, obs_space, dist_dim, model_options) dist = dist_class(model.outputs) self.sampler = dist.sample() @@ -69,6 +72,7 @@ def compute(self, observation, add_noise=False, update=True): observation = self.observation_filter(observation[None], update=update) action = self.sess.run( self.sampler, feed_dict={self.inputs: observation}) + action = _unbatch_tuple_actions(action) if add_noise and isinstance(self.action_space, gym.spaces.Box): action += np.random.randn(*action.shape) * self.action_noise_std return action @@ -78,3 +82,9 @@ def set_weights(self, x): def get_weights(self): return self.variables.get_flat() + + def get_filter(self): + return self.observation_filter + + def set_filter(self, observation_filter): + self.observation_filter = observation_filter diff --git a/python/ray/rllib/agents/es/tabular_logger.py b/python/ray/rllib/agents/es/tabular_logger.py deleted file mode 100644 index 1463e59e07046..0000000000000 --- a/python/ray/rllib/agents/es/tabular_logger.py +++ /dev/null @@ -1,229 +0,0 @@ -# Code in this file is copied and adapted from -# https://github.com/openai/evolution-strategies-starter. 
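The hand-rolled tabular logger deleted below is superseded by the standard logging module: the agents touched in this diff now create module-level loggers (logger = logging.getLogger(__name__)) and report metrics through the returned result dict rather than tabular dumps. To surface those logger.info messages when running a script directly, the stdlib logger can be configured in the usual way, for example:

import logging

# Show INFO-level messages from module loggers such as ray.rllib.agents.es.es.
logging.basicConfig(level=logging.INFO)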
- -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -from collections import OrderedDict -import os -import sys -import time - -import tensorflow as tf -from tensorflow.core.util import event_pb2 -from tensorflow.python import pywrap_tensorflow -from tensorflow.python.util import compat - -DEBUG = 10 -INFO = 20 -WARN = 30 -ERROR = 40 - -DISABLED = 50 - - -class TbWriter(object): - """Based on SummaryWriter, but changed to allow for a different prefix.""" - - def __init__(self, dir, prefix): - self.dir = dir - # Start at 1, because EvWriter automatically generates an object with - # step = 0. - self.step = 1 - self.evwriter = pywrap_tensorflow.EventsWriter( - compat.as_bytes(os.path.join(dir, prefix))) - - def write_values(self, key2val): - summary = tf.Summary(value=[ - tf.Summary.Value(tag=k, simple_value=float(v)) - for (k, v) in key2val.items() - ]) - event = event_pb2.Event(wall_time=time.time(), summary=summary) - event.step = self.step - self.evwriter.WriteEvent(event) - self.evwriter.Flush() - self.step += 1 - - def close(self): - self.evwriter.Close() - - -# API - - -def start(dir): - if _Logger.CURRENT is not _Logger.DEFAULT: - sys.stderr.write("WARNING: You asked to start logging (dir=%s), but " - "you never stopped the previous logger (dir=%s)." - "\n" % (dir, _Logger.CURRENT.dir)) - _Logger.CURRENT = _Logger(dir=dir) - - -def stop(): - if _Logger.CURRENT is _Logger.DEFAULT: - sys.stderr.write("WARNING: You asked to stop logging, but you never " - "started any previous logger." - "\n" % (dir, _Logger.CURRENT.dir)) - return - _Logger.CURRENT.close() - _Logger.CURRENT = _Logger.DEFAULT - - -def record_tabular(key, val): - """Log a value of some diagnostic. - - Call this once for each diagnostic quantity, each iteration. - """ - _Logger.CURRENT.record_tabular(key, val) - - -def dump_tabular(): - """Write all of the diagnostics from the current iteration.""" - _Logger.CURRENT.dump_tabular() - - -def log(*args, **kwargs): - """Write the sequence of args, with no separators. - - This is written to the console and output files (if you've configured an - output file). - """ - level = kwargs['level'] if 'level' in kwargs else INFO - _Logger.CURRENT.log(*args, level=level) - - -def debug(*args): - log(*args, level=DEBUG) - - -def info(*args): - log(*args, level=INFO) - - -def warn(*args): - log(*args, level=WARN) - - -def error(*args): - log(*args, level=ERROR) - - -def set_level(level): - """ - Set logging threshold on current logger. - """ - _Logger.CURRENT.set_level(level) - - -def get_dir(): - """ - Get directory that log files are being written to. - will be None if there is no output directory (i.e., if you didn't call - start) - """ - return _Logger.CURRENT.get_dir() - - -def get_expt_dir(): - sys.stderr.write("get_expt_dir() is Deprecated. Switch to get_dir()\n") - return get_dir() - - -# Backend - - -class _Logger(object): - # A logger with no output files. (See right below class definition) so that - # you can still log to the terminal without setting up any output files. - DEFAULT = None - # Current logger being used by the free functions above. - CURRENT = None - - def __init__(self, dir=None): - self.name2val = OrderedDict() # Values this iteration. 
- self.level = INFO - self.dir = dir - self.text_outputs = [sys.stdout] - if dir is not None: - os.makedirs(dir, exist_ok=True) - self.text_outputs.append(open(os.path.join(dir, "log.txt"), "w")) - self.tbwriter = TbWriter(dir=dir, prefix="events") - else: - self.tbwriter = None - - # Logging API, forwarded - - def record_tabular(self, key, val): - self.name2val[key] = val - - def dump_tabular(self): - # Create strings for printing. - key2str = OrderedDict() - for (key, val) in self.name2val.items(): - if hasattr(val, "__float__"): - valstr = "%-8.3g" % val - else: - valstr = val - key2str[self._truncate(key)] = self._truncate(valstr) - keywidth = max(map(len, key2str.keys())) - valwidth = max(map(len, key2str.values())) - # Write to all text outputs - self._write_text("-" * (keywidth + valwidth + 7), "\n") - for (key, val) in key2str.items(): - self._write_text("| ", key, " " * (keywidth - len(key)), " | ", - val, " " * (valwidth - len(val)), " |\n") - self._write_text("-" * (keywidth + valwidth + 7), "\n") - for f in self.text_outputs: - try: - f.flush() - except OSError: - sys.stderr.write('Warning! OSError when flushing.\n') - # Write to tensorboard - if self.tbwriter is not None: - self.tbwriter.write_values(self.name2val) - self.name2val.clear() - - def log(self, *args, **kwargs): - level = kwargs['level'] if 'level' in kwargs else INFO - if self.level <= level: - self._do_log(*args) - - # Configuration - - def set_level(self, level): - self.level = level - - def get_dir(self): - return self.dir - - def close(self): - for f in self.text_outputs[1:]: - f.close() - if self.tbwriter: - self.tbwriter.close() - - # Misc - - def _do_log(self, *args): - self._write_text(*args + ('\n', )) - for f in self.text_outputs: - try: - f.flush() - except OSError: - print('Warning! OSError when flushing.') - - def _write_text(self, *strings): - for f in self.text_outputs: - for string in strings: - f.write(string) - - def _truncate(self, s): - if len(s) > 33: - return s[:30] + "..." - else: - return s - - -_Logger.DEFAULT = _Logger() -_Logger.CURRENT = _Logger.DEFAULT diff --git a/python/ray/rllib/agents/impala/impala.py b/python/ray/rllib/agents/impala/impala.py index cfa55bd735c88..aa789387f9300 100644 --- a/python/ray/rllib/agents/impala/impala.py +++ b/python/ray/rllib/agents/impala/impala.py @@ -8,13 +8,24 @@ from ray.rllib.agents.impala.vtrace_policy_graph import VTracePolicyGraph from ray.rllib.agents.agent import Agent, with_common_config from ray.rllib.optimizers import AsyncSamplesOptimizer -from ray.tune.trial import Resources +from ray.rllib.utils.annotations import override OPTIMIZER_SHARED_CONFIGS = [ + "lr", + "num_envs_per_worker", + "num_gpus", "sample_batch_size", "train_batch_size", + "replay_buffer_num_slots", + "replay_proportion", + "num_parallel_data_loaders", + "grad_clip", + "max_sample_requests_in_flight_per_worker", + "broadcast_interval", ] +# yapf: disable +# __sphinx_doc_begin__ DEFAULT_CONFIG = with_common_config({ # V-trace params (see vtrace.py). "vtrace": True, @@ -25,10 +36,22 @@ "sample_batch_size": 50, "train_batch_size": 500, "min_iter_time_s": 10, - "gpu": True, "num_workers": 2, - "num_cpus_per_worker": 1, - "num_gpus_per_worker": 0, + # number of GPUs the learner should use. + "num_gpus": 1, + # set >1 to load data into GPUs in parallel. Increases GPU memory usage + # proportionally with the number of loaders. + "num_parallel_data_loaders": 1, + # level of queuing for sampling. 
+ "max_sample_requests_in_flight_per_worker": 2, + # max number of workers to broadcast one set of weights to + "broadcast_interval": 1, + # set >0 to enable experience replay. Saved samples will be replayed with + # a p:1 proportion to new data samples. + "replay_proportion": 0.0, + # number of sample batches to store for replay. The number of transitions + # saved total will be (replay_buffer_num_slots * sample_batch_size). + "replay_buffer_num_slots": 100, # Learning params. "grad_clip": 40.0, @@ -43,14 +66,9 @@ # balancing the three losses "vf_loss_coeff": 0.5, "entropy_coeff": -0.01, - - # Model and preprocessor options. - "model": { - "use_lstm": False, - "max_seq_len": 20, - "dim": 84, - }, }) +# __sphinx_doc_end__ +# yapf: enable class ImpalaAgent(Agent): @@ -60,15 +78,7 @@ class ImpalaAgent(Agent): _default_config = DEFAULT_CONFIG _policy_graph = VTracePolicyGraph - @classmethod - def default_resource_request(cls, config): - cf = dict(cls._default_config, **config) - return Resources( - cpu=1, - gpu=cf["gpu"] and cf["gpu_fraction"] or 0, - extra_cpu=cf["num_cpus_per_worker"] * cf["num_workers"], - extra_gpu=cf["num_gpus_per_worker"] * cf["num_workers"]) - + @override(Agent) def _init(self): for k in OPTIMIZER_SHARED_CONFIGS: if k not in self.config["optimizer"]: @@ -80,19 +90,20 @@ def _init(self): self.local_evaluator = self.make_local_evaluator( self.env_creator, policy_cls) self.remote_evaluators = self.make_remote_evaluators( - self.env_creator, policy_cls, self.config["num_workers"], - {"num_cpus": 1}) + self.env_creator, policy_cls, self.config["num_workers"]) self.optimizer = AsyncSamplesOptimizer(self.local_evaluator, self.remote_evaluators, self.config["optimizer"]) + @override(Agent) def _train(self): prev_steps = self.optimizer.num_steps_sampled start = time.time() self.optimizer.step() while time.time() - start < self.config["min_iter_time_s"]: self.optimizer.step() - result = self.optimizer.collect_metrics() + result = self.optimizer.collect_metrics( + self.config["collect_metrics_timeout"]) result.update(timesteps_this_iter=self.optimizer.num_steps_sampled - prev_steps) return result diff --git a/python/ray/rllib/agents/impala/vtrace_policy_graph.py b/python/ray/rllib/agents/impala/vtrace_policy_graph.py index 23f88e51f51b7..5eed0a6e79e5f 100644 --- a/python/ray/rllib/agents/impala/vtrace_policy_graph.py +++ b/python/ray/rllib/agents/impala/vtrace_policy_graph.py @@ -11,12 +11,14 @@ import ray from ray.rllib.agents.impala import vtrace +from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph, \ LearningRateSchedule from ray.rllib.models.catalog import ModelCatalog -from ray.rllib.models.misc import linear, normc_initializer +from ray.rllib.utils.annotations import override from ray.rllib.utils.error import UnsupportedSpaceException from ray.rllib.utils.explained_variance import explained_variance +from ray.rllib.models.action_dist import Categorical class VTraceLoss(object): @@ -31,6 +33,7 @@ def __init__(self, rewards, values, bootstrap_value, + valid_mask, vf_loss_coeff=0.5, entropy_coeff=-0.01, clip_rho_threshold=1.0, @@ -52,6 +55,7 @@ def __init__(self, rewards: A float32 tensor of shape [T, B]. values: A float32 tensor of shape [T, B]. bootstrap_value: A float32 tensor of shape [B]. + valid_mask: A bool tensor of valid RNN input elements (#2992). """ # Compute vtrace on the CPU for better perf. 
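valid_mask exists because LSTM rollouts are padded to a common sequence length before being reshaped to [T, B]; the padded timesteps must not contribute to the loss, and the following hunk excludes them with tf.boolean_mask. A minimal TF 1.x sketch of that masking idea with toy values (not the actual graph built here):

import tensorflow as tf

# Two sequences padded to length 4; only the first 3 and 1 entries are real.
seq_lens = tf.constant([3, 1])
values = tf.constant([[1.0, 2.0, 3.0, -7.0],
                      [5.0, -7.0, -7.0, -7.0]])  # -7.0 marks padding garbage

mask = tf.sequence_mask(seq_lens, maxlen=4)       # bool tensor of shape [B, T]
valid = tf.boolean_mask(values, mask)             # keeps only the 4 real entries
mean_valid = tf.reduce_mean(valid)                # 2.75, padding ignored

with tf.Session() as sess:
    print(sess.run([valid, mean_valid]))          # [1. 2. 3. 5.], 2.75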
@@ -70,14 +74,16 @@ def __init__(self, # The policy gradients loss self.pi_loss = -tf.reduce_sum( - actions_logp * self.vtrace_returns.pg_advantages) + tf.boolean_mask(actions_logp * self.vtrace_returns.pg_advantages, + valid_mask)) # The baseline loss - delta = values - self.vtrace_returns.vs + delta = tf.boolean_mask(values - self.vtrace_returns.vs, valid_mask) self.vf_loss = 0.5 * tf.reduce_sum(tf.square(delta)) # The entropy loss - self.entropy = tf.reduce_sum(actions_entropy) + self.entropy = tf.reduce_sum( + tf.boolean_mask(actions_entropy, valid_mask)) # The summed weighted loss self.total_loss = (self.pi_loss + self.vf_loss * vf_loss_coeff + @@ -85,40 +91,62 @@ def __init__(self, class VTracePolicyGraph(LearningRateSchedule, TFPolicyGraph): - def __init__(self, observation_space, action_space, config): + def __init__(self, + observation_space, + action_space, + config, + existing_inputs=None): config = dict(ray.rllib.agents.impala.impala.DEFAULT_CONFIG, **config) assert config["batch_mode"] == "truncate_episodes", \ "Must use `truncate_episodes` batch mode with V-trace." self.config = config self.sess = tf.get_default_session() + # Create input placeholders + if existing_inputs: + actions, dones, behaviour_logits, rewards, observations, \ + prev_actions, prev_rewards = existing_inputs[:7] + existing_state_in = existing_inputs[7:-1] + existing_seq_lens = existing_inputs[-1] + else: + if isinstance(action_space, gym.spaces.Discrete): + ac_size = action_space.n + actions = tf.placeholder(tf.int64, [None], name="ac") + else: + raise UnsupportedSpaceException( + "Action space {} is not supported for IMPALA.".format( + action_space)) + dones = tf.placeholder(tf.bool, [None], name="dones") + rewards = tf.placeholder(tf.float32, [None], name="rewards") + behaviour_logits = tf.placeholder( + tf.float32, [None, ac_size], name="behaviour_logits") + observations = tf.placeholder( + tf.float32, [None] + list(observation_space.shape)) + existing_state_in = None + existing_seq_lens = None + # Setup the policy - self.observations = tf.placeholder( - tf.float32, [None] + list(observation_space.shape)) dist_class, logit_dim = ModelCatalog.get_action_dist( action_space, self.config["model"]) - self.model = ModelCatalog.get_model(self.observations, logit_dim, - self.config["model"]) + prev_actions = ModelCatalog.get_action_placeholder(action_space) + prev_rewards = tf.placeholder(tf.float32, [None], name="prev_reward") + self.model = ModelCatalog.get_model( + { + "obs": observations, + "prev_actions": prev_actions, + "prev_rewards": prev_rewards, + "is_training": self._get_is_training_placeholder(), + }, + observation_space, + logit_dim, + self.config["model"], + state_in=existing_state_in, + seq_lens=existing_seq_lens) action_dist = dist_class(self.model.outputs) - values = tf.reshape( - linear(self.model.last_layer, 1, "value", normc_initializer(1.0)), - [-1]) + values = self.model.value_function() self.var_list = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES, tf.get_variable_scope().name) - # Setup the policy loss - if isinstance(action_space, gym.spaces.Discrete): - ac_size = action_space.n - actions = tf.placeholder(tf.int64, [None], name="ac") - else: - raise UnsupportedSpaceException( - "Action space {} is not supported for IMPALA.".format( - action_space)) - dones = tf.placeholder(tf.bool, [None], name="dones") - rewards = tf.placeholder(tf.float32, [None], name="rewards") - behaviour_logits = tf.placeholder( - tf.float32, [None, ac_size], name="behaviour_logits") - def 
to_batches(tensor): if self.config["model"]["use_lstm"]: B = tf.shape(self.model.seq_lens)[0] @@ -126,8 +154,7 @@ def to_batches(tensor): else: # Important: chop the tensor into batches at known episode cut # boundaries. TODO(ekl) this is kind of a hack - T = (self.config["sample_batch_size"] // - self.config["num_envs_per_worker"]) + T = self.config["sample_batch_size"] B = tf.shape(tensor)[0] // T rs = tf.reshape(tensor, tf.concat([[B, T], tf.shape(tensor)[1:]], axis=0)) @@ -136,6 +163,13 @@ def to_batches(tensor): rs, [1, 0] + list(range(2, 1 + int(tf.shape(tensor).shape[0])))) + if self.model.state_in: + max_seq_len = tf.reduce_max(self.model.seq_lens) - 1 + mask = tf.sequence_mask(self.model.seq_lens, max_seq_len) + mask = tf.reshape(mask, [-1]) + else: + mask = tf.ones_like(rewards) + # Inputs are reshaped from [B * T] => [T - 1, B] for V-trace calc. self.loss = VTraceLoss( actions=to_batches(actions)[:-1], @@ -148,18 +182,29 @@ def to_batches(tensor): rewards=to_batches(rewards)[:-1], values=to_batches(values)[:-1], bootstrap_value=to_batches(values)[-1], + valid_mask=to_batches(mask)[:-1], vf_loss_coeff=self.config["vf_loss_coeff"], entropy_coeff=self.config["entropy_coeff"], clip_rho_threshold=self.config["vtrace_clip_rho_threshold"], clip_pg_rho_threshold=self.config["vtrace_clip_pg_rho_threshold"]) + # KL divergence between worker and learner logits for debugging + model_dist = Categorical(self.model.outputs) + behaviour_dist = Categorical(behaviour_logits) + self.KLs = model_dist.kl(behaviour_dist) + self.mean_KL = tf.reduce_mean(self.KLs) + self.max_KL = tf.reduce_max(self.KLs) + self.median_KL = tf.contrib.distributions.percentile(self.KLs, 50.0) + # Initialize TFPolicyGraph loss_in = [ ("actions", actions), ("dones", dones), ("behaviour_logits", behaviour_logits), ("rewards", rewards), - ("obs", self.observations), + ("obs", observations), + ("prev_actions", prev_actions), + ("prev_rewards", prev_rewards), ] LearningRateSchedule.__init__(self, self.config["lr"], self.config["lr_schedule"]) @@ -168,14 +213,17 @@ def to_batches(tensor): observation_space, action_space, self.sess, - obs_input=self.observations, + obs_input=observations, action_sampler=action_dist.sample(), - loss=self.loss.total_loss, + loss=self.model.loss() + self.loss.total_loss, loss_inputs=loss_in, state_inputs=self.model.state_in, state_outputs=self.model.state_out, + prev_action_input=prev_actions, + prev_reward_input=prev_rewards, seq_lens=self.model.seq_lens, - max_seq_len=self.config["model"]["max_seq_len"]) + max_seq_len=self.config["model"]["max_seq_len"], + batch_divisibility_req=self.config["sample_batch_size"]) self.sess.run(tf.global_variables_initializer()) @@ -190,9 +238,21 @@ def to_batches(tensor): "vf_explained_var": explained_variance( tf.reshape(self.loss.vtrace_returns.vs, [-1]), tf.reshape(to_batches(values)[:-1], [-1])), + "mean_KL": self.mean_KL, + "max_KL": self.max_KL, + "median_KL": self.median_KL, }, } + @override(TFPolicyGraph) + def copy(self, existing_inputs): + return VTracePolicyGraph( + self.observation_space, + self.action_space, + self.config, + existing_inputs=existing_inputs) + + @override(TFPolicyGraph) def optimizer(self): if self.config["opt_type"] == "adam": return tf.train.AdamOptimizer(self.cur_lr) @@ -201,21 +261,29 @@ def optimizer(self): self.config["momentum"], self.config["epsilon"]) + @override(TFPolicyGraph) def gradients(self, optimizer): grads = tf.gradients(self.loss.total_loss, self.var_list) self.grads, _ = tf.clip_by_global_norm(grads, 
self.config["grad_clip"]) clipped_grads = list(zip(self.grads, self.var_list)) return clipped_grads + @override(TFPolicyGraph) def extra_compute_action_fetches(self): return {"behaviour_logits": self.model.outputs} + @override(TFPolicyGraph) def extra_compute_grad_fetches(self): return self.stats_fetches - def postprocess_trajectory(self, sample_batch, other_agent_batches=None): + @override(PolicyGraph) + def postprocess_trajectory(self, + sample_batch, + other_agent_batches=None, + episode=None): del sample_batch.data["new_obs"] # not used, so save some bandwidth return sample_batch + @override(PolicyGraph) def get_initial_state(self): return self.model.state_init diff --git a/python/ray/rllib/agents/mock.py b/python/ray/rllib/agents/mock.py index 526ec146a8e2f..f4bf909918095 100644 --- a/python/ray/rllib/agents/mock.py +++ b/python/ray/rllib/agents/mock.py @@ -6,18 +6,19 @@ import pickle import numpy as np -from ray.rllib.agents.agent import Agent +from ray.rllib.agents.agent import Agent, with_common_config class _MockAgent(Agent): """Mock agent for use in tests""" _agent_name = "MockAgent" - _default_config = { + _default_config = with_common_config({ "mock_error": False, "persistent_error": False, - "test_variable": 1 - } + "test_variable": 1, + "num_workers": 0, + }) def _init(self): self.info = None @@ -59,13 +60,14 @@ class _SigmoidFakeData(_MockAgent): This can be helpful for evaluating early stopping algorithms.""" _agent_name = "SigmoidFakeData" - _default_config = { + _default_config = with_common_config({ "width": 100, "height": 100, "offset": 0, "iter_time": 10, "iter_timesteps": 1, - } + "num_workers": 0, + }) def _train(self): i = max(0, self.iteration - self.config["offset"]) @@ -82,13 +84,14 @@ def _train(self): class _ParameterTuningAgent(_MockAgent): _agent_name = "ParameterTuningAgent" - _default_config = { + _default_config = with_common_config({ "reward_amt": 10, "dummy_param": 10, "dummy_param2": 15, "iter_time": 10, - "iter_timesteps": 1 - } + "iter_timesteps": 1, + "num_workers": 0, + }) def _train(self): return dict( diff --git a/python/ray/rllib/agents/pg/pg.py b/python/ray/rllib/agents/pg/pg.py index e1766e7744f23..69c6761863c6a 100644 --- a/python/ray/rllib/agents/pg/pg.py +++ b/python/ray/rllib/agents/pg/pg.py @@ -5,22 +5,18 @@ from ray.rllib.agents.agent import Agent, with_common_config from ray.rllib.agents.pg.pg_policy_graph import PGPolicyGraph from ray.rllib.optimizers import SyncSamplesOptimizer -from ray.rllib.utils import merge_dicts -from ray.tune.trial import Resources +from ray.rllib.utils.annotations import override +# yapf: disable +# __sphinx_doc_begin__ DEFAULT_CONFIG = with_common_config({ # No remote workers by default "num_workers": 0, # Learning rate "lr": 0.0004, - # Override model config - "model": { - # Use LSTM model. - "use_lstm": False, - # Max seq length for LSTM training. 
- "max_seq_len": 20, - }, }) +# __sphinx_doc_end__ +# yapf: enable class PGAgent(Agent): @@ -34,25 +30,22 @@ class PGAgent(Agent): _default_config = DEFAULT_CONFIG _policy_graph = PGPolicyGraph - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - return Resources(cpu=1, gpu=0, extra_cpu=cf["num_workers"]) - + @override(Agent) def _init(self): self.local_evaluator = self.make_local_evaluator( self.env_creator, self._policy_graph) self.remote_evaluators = self.make_remote_evaluators( - self.env_creator, self._policy_graph, self.config["num_workers"], - {}) + self.env_creator, self._policy_graph, self.config["num_workers"]) self.optimizer = SyncSamplesOptimizer(self.local_evaluator, self.remote_evaluators, self.config["optimizer"]) + @override(Agent) def _train(self): prev_steps = self.optimizer.num_steps_sampled self.optimizer.step() - result = self.optimizer.collect_metrics() + result = self.optimizer.collect_metrics( + self.config["collect_metrics_timeout"]) result.update(timesteps_this_iter=self.optimizer.num_steps_sampled - prev_steps) return result diff --git a/python/ray/rllib/agents/pg/pg_policy_graph.py b/python/ray/rllib/agents/pg/pg_policy_graph.py index bb831c47d4ee4..59e9a9effc12b 100644 --- a/python/ray/rllib/agents/pg/pg_policy_graph.py +++ b/python/ray/rllib/agents/pg/pg_policy_graph.py @@ -7,25 +7,39 @@ import ray from ray.rllib.models.catalog import ModelCatalog from ray.rllib.evaluation.postprocessing import compute_advantages +from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph +from ray.rllib.utils.annotations import override class PGLoss(object): + """Simple policy gradient loss.""" + def __init__(self, action_dist, actions, advantages): self.loss = -tf.reduce_mean(action_dist.logp(actions) * advantages) class PGPolicyGraph(TFPolicyGraph): + """Simple policy gradient example of defining a policy graph.""" + def __init__(self, obs_space, action_space, config): config = dict(ray.rllib.agents.pg.pg.DEFAULT_CONFIG, **config) self.config = config - # Setup policy + # Setup placeholders obs = tf.placeholder(tf.float32, shape=[None] + list(obs_space.shape)) dist_class, self.logit_dim = ModelCatalog.get_action_dist( action_space, self.config["model"]) - self.model = ModelCatalog.get_model( - obs, self.logit_dim, options=self.config["model"]) + prev_actions = ModelCatalog.get_action_placeholder(action_space) + prev_rewards = tf.placeholder(tf.float32, [None], name="prev_reward") + + # Create the model network and action outputs + self.model = ModelCatalog.get_model({ + "obs": obs, + "prev_actions": prev_actions, + "prev_rewards": prev_rewards, + "is_training": self._get_is_training_placeholder(), + }, obs_space, self.logit_dim, self.config["model"]) action_dist = dist_class(self.model.outputs) # logit for each action # Setup policy loss @@ -33,14 +47,19 @@ def __init__(self, obs_space, action_space, config): advantages = tf.placeholder(tf.float32, [None], name="adv") loss = PGLoss(action_dist, actions, advantages).loss - # Initialize TFPolicyGraph - sess = tf.get_default_session() + # Mapping from sample batch keys to placeholders. These keys will be + # read from postprocessed sample batches and fed into the specified + # placeholders during loss computation. 
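Concretely, each (column name, placeholder) pair declared in loss_in below tells TFPolicyGraph which array of the postprocessed batch to feed into which placeholder when the loss is evaluated. A framework-free sketch of that pairing; the arrays, names, and string "placeholders" are stand-ins, not the real objects:

import numpy as np

# Stand-ins: placeholder objects replaced by plain strings for illustration.
loss_inputs = [("obs", "obs_ph"), ("actions", "act_ph"), ("advantages", "adv_ph")]

# A postprocessed sample batch: equal-length columns keyed by name.
batch = {
    "obs": np.random.randn(4, 3),
    "actions": np.array([0, 1, 1, 0]),
    "advantages": np.array([0.5, -0.2, 1.1, 0.0]),
}

# The feed dict pairs each declared column with its placeholder.
feed_dict = {ph: batch[name] for name, ph in loss_inputs}
print(sorted(feed_dict.keys()))  # ['act_ph', 'adv_ph', 'obs_ph']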
loss_in = [ ("obs", obs), ("actions", actions), - ("advantages", advantages), + ("prev_actions", prev_actions), + ("prev_rewards", prev_rewards), + ("advantages", advantages), # added during postprocessing ] + # Initialize TFPolicyGraph + sess = tf.get_default_session() TFPolicyGraph.__init__( self, obs_space, @@ -48,17 +67,25 @@ def __init__(self, obs_space, action_space, config): sess, obs_input=obs, action_sampler=action_dist.sample(), - loss=loss, + loss=self.model.loss() + loss, loss_inputs=loss_in, state_inputs=self.model.state_in, state_outputs=self.model.state_out, + prev_action_input=prev_actions, + prev_reward_input=prev_rewards, seq_lens=self.model.seq_lens, max_seq_len=config["model"]["max_seq_len"]) sess.run(tf.global_variables_initializer()) - def postprocess_trajectory(self, sample_batch, other_agent_batches=None): + @override(PolicyGraph) + def postprocess_trajectory(self, + sample_batch, + other_agent_batches=None, + episode=None): + # This adds the "advantages" column to the sample batch return compute_advantages( sample_batch, 0.0, self.config["gamma"], use_gae=False) + @override(PolicyGraph) def get_initial_state(self): return self.model.state_init diff --git a/python/ray/rllib/agents/ppo/ppo.py b/python/ray/rllib/agents/ppo/ppo.py index f452f789397ea..0c10b279ab221 100644 --- a/python/ray/rllib/agents/ppo/ppo.py +++ b/python/ray/rllib/agents/ppo/ppo.py @@ -2,12 +2,17 @@ from __future__ import division from __future__ import print_function +import logging + from ray.rllib.agents import Agent, with_common_config from ray.rllib.agents.ppo.ppo_policy_graph import PPOPolicyGraph -from ray.rllib.utils import merge_dicts from ray.rllib.optimizers import SyncSamplesOptimizer, LocalMultiGPUOptimizer -from ray.tune.trial import Resources +from ray.rllib.utils.annotations import override + +logger = logging.getLogger(__name__) +# yapf: disable +# __sphinx_doc_begin__ DEFAULT_CONFIG = with_common_config({ # If true, use the Generalized Advantage Estimator (GAE) # with a value function, see https://arxiv.org/pdf/1506.02438.pdf. @@ -20,7 +25,7 @@ "sample_batch_size": 200, # Number of timesteps collected for each SGD round "train_batch_size": 4000, - # Total SGD batch size across all devices for SGD (multi-gpu only) + # Total SGD batch size across all devices for SGD "sgd_minibatch_size": 128, # Number of SGD iterations in each outer loop "num_sgd_iter": 30, @@ -41,26 +46,16 @@ "vf_clip_param": 10.0, # Target value for KL divergence "kl_target": 0.01, - # Number of GPUs to use for SGD - "num_gpus": 0, - # Whether to allocate GPUs for workers (if > 0). - "num_gpus_per_worker": 0, - # Whether to allocate CPUs for workers (if > 0). - "num_cpus_per_worker": 1, # Whether to rollout "complete_episodes" or "truncate_episodes" - "batch_mode": "complete_episodes", + "batch_mode": "truncate_episodes", # Which observation filter to apply to the observation "observation_filter": "MeanStdFilter", - # Use the sync samples optimizer instead of the multi-gpu one + # Uses the sync samples optimizer instead of the multi-gpu one. This does + # not support minibatches. "simple_optimizer": False, - # Override model config - "model": { - # Whether to use LSTM model - "use_lstm": False, - # Max seq length for LSTM training. 
- "max_seq_len": 20, - }, }) +# __sphinx_doc_end__ +# yapf: enable class PPOAgent(Agent): @@ -70,39 +65,18 @@ class PPOAgent(Agent): _default_config = DEFAULT_CONFIG _policy_graph = PPOPolicyGraph - @classmethod - def default_resource_request(cls, config): - cf = merge_dicts(cls._default_config, config) - return Resources( - cpu=1, - gpu=cf["num_gpus"], - extra_cpu=cf["num_cpus_per_worker"] * cf["num_workers"], - extra_gpu=cf["num_gpus_per_worker"] * cf["num_workers"]) - + @override(Agent) def _init(self): - waste_ratio = ( - self.config["sample_batch_size"] * self.config["num_workers"] / - self.config["train_batch_size"]) - if waste_ratio > 1: - msg = ("sample_batch_size * num_workers >> train_batch_size. " - "This means that many steps will be discarded. Consider " - "reducing sample_batch_size, or increase train_batch_size.") - if waste_ratio > 1.5: - raise ValueError(msg) - else: - print("Warning: " + msg) + self._validate_config() self.local_evaluator = self.make_local_evaluator( self.env_creator, self._policy_graph) self.remote_evaluators = self.make_remote_evaluators( - self.env_creator, self._policy_graph, self.config["num_workers"], { - "num_cpus": self.config["num_cpus_per_worker"], - "num_gpus": self.config["num_gpus_per_worker"] - }) + self.env_creator, self._policy_graph, self.config["num_workers"]) if self.config["simple_optimizer"]: self.optimizer = SyncSamplesOptimizer( self.local_evaluator, self.remote_evaluators, { "num_sgd_iter": self.config["num_sgd_iter"], - "train_batch_size": self.config["train_batch_size"] + "train_batch_size": self.config["train_batch_size"], }) else: self.optimizer = LocalMultiGPUOptimizer( @@ -114,6 +88,7 @@ def _init(self): "standardize_fields": ["advantages"], }) + @override(Agent) def _train(self): prev_steps = self.optimizer.num_steps_sampled fetches = self.optimizer.step() @@ -125,8 +100,42 @@ def _train(self): # multi-agent self.local_evaluator.foreach_trainable_policy( lambda pi, pi_id: pi.update_kl(fetches[pi_id]["kl"])) - res = self.optimizer.collect_metrics() + res = self.optimizer.collect_metrics( + self.config["collect_metrics_timeout"]) res.update( timesteps_this_iter=self.optimizer.num_steps_sampled - prev_steps, info=dict(fetches, **res.get("info", {}))) return res + + def _validate_config(self): + waste_ratio = ( + self.config["sample_batch_size"] * self.config["num_workers"] / + self.config["train_batch_size"]) + if waste_ratio > 1: + msg = ("sample_batch_size * num_workers >> train_batch_size. " + "This means that many steps will be discarded. Consider " + "reducing sample_batch_size, or increase train_batch_size.") + if waste_ratio > 1.5: + raise ValueError(msg) + else: + logger.warn(msg) + if self.config["sgd_minibatch_size"] > self.config["train_batch_size"]: + raise ValueError( + "Minibatch size {} must be <= train batch size {}.".format( + self.config["sgd_minibatch_size"], + self.config["train_batch_size"])) + if (self.config["batch_mode"] == "truncate_episodes" + and not self.config["use_gae"]): + raise ValueError( + "Episode truncation is not supported without a value function") + if (self.config["multiagent"]["policy_graphs"] + and not self.config["simple_optimizer"]): + logger.info( + "In multi-agent mode, policies will be optimized sequentially " + "by the multi-GPU optimizer. 
Consider setting " + "simple_optimizer=True if this doesn't work for you.") + if self.config["observation_filter"] != "NoFilter": + # TODO(ekl): consider setting the default to be NoFilter + logger.warn( + "By default, observations will be normalized with {}".format( + self.config["observation_filter"])) diff --git a/python/ray/rllib/agents/ppo/ppo_policy_graph.py b/python/ray/rllib/agents/ppo/ppo_policy_graph.py index e6fc90d1ce948..6948d810a26be 100644 --- a/python/ray/rllib/agents/ppo/ppo_policy_graph.py +++ b/python/ray/rllib/agents/ppo/ppo_policy_graph.py @@ -6,10 +6,11 @@ import ray from ray.rllib.evaluation.postprocessing import compute_advantages +from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph, \ LearningRateSchedule from ray.rllib.models.catalog import ModelCatalog -from ray.rllib.models.misc import linear, normc_initializer +from ray.rllib.utils.annotations import override from ray.rllib.utils.explained_variance import explained_variance @@ -24,6 +25,7 @@ def __init__(self, curr_action_dist, value_fn, cur_kl_coeff, + valid_mask, entropy_coeff=0, clip_param=0.1, vf_clip_param=0.1, @@ -48,28 +50,33 @@ def __init__(self, value_fn (Tensor): Current value function output Tensor. cur_kl_coeff (Variable): Variable holding the current PPO KL coefficient. + valid_mask (Tensor): A bool mask of valid input elements (#2992). entropy_coeff (float): Coefficient of the entropy regularizer. clip_param (float): Clip parameter vf_clip_param (float): Clip parameter for the value function vf_loss_coeff (float): Coefficient of the value function loss use_gae (bool): If true, use the Generalized Advantage Estimator. """ - dist_cls, _ = ModelCatalog.get_action_dist(action_space) + + def reduce_mean_valid(t): + return tf.reduce_mean(tf.boolean_mask(t, valid_mask)) + + dist_cls, _ = ModelCatalog.get_action_dist(action_space, {}) prev_dist = dist_cls(logits) # Make loss functions. 
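What follows is the PPO clipped surrogate objective: the likelihood ratio between the current policy and the policy that generated the samples is clipped to [1 - clip_param, 1 + clip_param], and the pessimistic minimum of the clipped and unclipped advantage-weighted terms is used. A small numpy illustration of just that term, with toy log-probabilities and advantages:

import numpy as np

clip_param = 0.3
logp_new = np.array([-0.5, -1.2, -0.1])   # log pi_new(a|s) for sampled actions
logp_old = np.array([-0.7, -0.6, -0.9])   # log pi_old(a|s) at sampling time
advantages = np.array([1.0, -2.0, 0.5])

ratio = np.exp(logp_new - logp_old)
surrogate = np.minimum(ratio * advantages,
                       np.clip(ratio, 1 - clip_param, 1 + clip_param) * advantages)
policy_loss = -surrogate.mean()            # minimized by the optimizer
print(ratio.round(3), round(policy_loss, 3))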
logp_ratio = tf.exp( curr_action_dist.logp(actions) - prev_dist.logp(actions)) action_kl = prev_dist.kl(curr_action_dist) - self.mean_kl = tf.reduce_mean(action_kl) + self.mean_kl = reduce_mean_valid(action_kl) curr_entropy = curr_action_dist.entropy() - self.mean_entropy = tf.reduce_mean(curr_entropy) + self.mean_entropy = reduce_mean_valid(curr_entropy) surrogate_loss = tf.minimum( advantages * logp_ratio, advantages * tf.clip_by_value(logp_ratio, 1 - clip_param, 1 + clip_param)) - self.mean_policy_loss = tf.reduce_mean(-surrogate_loss) + self.mean_policy_loss = reduce_mean_valid(-surrogate_loss) if use_gae: vf_loss1 = tf.square(value_fn - value_targets) @@ -77,14 +84,15 @@ def __init__(self, value_fn - vf_preds, -vf_clip_param, vf_clip_param) vf_loss2 = tf.square(vf_clipped - value_targets) vf_loss = tf.maximum(vf_loss1, vf_loss2) - self.mean_vf_loss = tf.reduce_mean(vf_loss) - loss = tf.reduce_mean(-surrogate_loss + cur_kl_coeff * action_kl + - vf_loss_coeff * vf_loss - - entropy_coeff * curr_entropy) + self.mean_vf_loss = reduce_mean_valid(vf_loss) + loss = reduce_mean_valid( + -surrogate_loss + cur_kl_coeff * action_kl + + vf_loss_coeff * vf_loss - entropy_coeff * curr_entropy) else: self.mean_vf_loss = tf.constant(0.0) - loss = tf.reduce_mean(-surrogate_loss + cur_kl_coeff * action_kl - - entropy_coeff * curr_entropy) + loss = reduce_mean_valid(-surrogate_loss + + cur_kl_coeff * action_kl - + entropy_coeff * curr_entropy) self.loss = loss @@ -108,12 +116,14 @@ def __init__(self, self.config = config self.kl_coeff_val = self.config["kl_coeff"] self.kl_target = self.config["kl_target"] - dist_cls, logit_dim = ModelCatalog.get_action_dist(action_space) + dist_cls, logit_dim = ModelCatalog.get_action_dist( + action_space, self.config["model"]) if existing_inputs: obs_ph, value_targets_ph, adv_ph, act_ph, \ - logits_ph, vf_preds_ph = existing_inputs[:6] - existing_state_in = existing_inputs[6:-1] + logits_ph, vf_preds_ph, prev_actions_ph, prev_rewards_ph = \ + existing_inputs[:8] + existing_state_in = existing_inputs[8:-1] existing_seq_lens = existing_inputs[-1] else: obs_ph = tf.placeholder( @@ -129,6 +139,9 @@ def __init__(self, tf.float32, name="vf_preds", shape=(None, )) value_targets_ph = tf.placeholder( tf.float32, name="value_targets", shape=(None, )) + prev_actions_ph = ModelCatalog.get_action_placeholder(action_space) + prev_rewards_ph = tf.placeholder( + tf.float32, [None], name="prev_reward") existing_state_in = None existing_seq_lens = None self.observations = obs_ph @@ -140,9 +153,17 @@ def __init__(self, ("actions", act_ph), ("logits", logits_ph), ("vf_preds", vf_preds_ph), + ("prev_actions", prev_actions_ph), + ("prev_rewards", prev_rewards_ph), ] self.model = ModelCatalog.get_model( - obs_ph, + { + "obs": obs_ph, + "prev_actions": prev_actions_ph, + "prev_rewards": prev_rewards_ph, + "is_training": self._get_is_training_placeholder(), + }, + observation_space, logit_dim, self.config["model"], state_in=existing_state_in, @@ -161,9 +182,7 @@ def __init__(self, self.sampler = curr_action_dist.sample() if self.config["use_gae"]: if self.config["vf_share_layers"]: - self.value_function = tf.reshape( - linear(self.model.last_layer, 1, "value", - normc_initializer(1.0)), [-1]) + self.value_function = self.model.value_function() else: vf_config = self.config["model"].copy() # Do not split the last layer of the value function into @@ -172,12 +191,23 @@ def __init__(self, vf_config["free_log_std"] = False vf_config["use_lstm"] = False with tf.variable_scope("value_function"): - 
self.value_function = ModelCatalog.get_model( - obs_ph, 1, vf_config).outputs + self.value_function = ModelCatalog.get_model({ + "obs": obs_ph, + "prev_actions": prev_actions_ph, + "prev_rewards": prev_rewards_ph, + "is_training": self._get_is_training_placeholder(), + }, observation_space, 1, vf_config).outputs self.value_function = tf.reshape(self.value_function, [-1]) else: self.value_function = tf.zeros(shape=tf.shape(obs_ph)[:1]) + if self.model.state_in: + max_seq_len = tf.reduce_max(self.model.seq_lens) + mask = tf.sequence_mask(self.model.seq_lens, max_seq_len) + mask = tf.reshape(mask, [-1]) + else: + mask = tf.ones_like(adv_ph) + self.loss_obj = PPOLoss( action_space, value_targets_ph, @@ -188,6 +218,7 @@ def __init__(self, curr_action_dist, self.value_function, self.kl_coeff, + mask, entropy_coeff=self.config["entropy_coeff"], clip_param=self.config["clip_param"], vf_clip_param=self.config["vf_clip_param"], @@ -203,10 +234,12 @@ def __init__(self, self.sess, obs_input=obs_ph, action_sampler=self.sampler, - loss=self.loss_obj.loss, + loss=self.model.loss() + self.loss_obj.loss, loss_inputs=self.loss_in, state_inputs=self.model.state_in, state_outputs=self.model.state_out, + prev_action_input=prev_actions_ph, + prev_reward_input=prev_rewards_ph, seq_lens=self.model.seq_lens, max_seq_len=config["model"]["max_seq_len"]) @@ -214,6 +247,7 @@ def __init__(self, self.explained_variance = explained_variance(value_targets_ph, self.value_function) self.stats_fetches = { + "cur_kl_coeff": self.kl_coeff, "cur_lr": tf.cast(self.cur_lr, tf.float64), "total_loss": self.loss_obj.loss, "policy_loss": self.loss_obj.mean_policy_loss, @@ -223,38 +257,20 @@ def __init__(self, "entropy": self.loss_obj.mean_entropy } + @override(TFPolicyGraph) def copy(self, existing_inputs): """Creates a copy of self using existing input placeholders.""" return PPOPolicyGraph( - None, + self.observation_space, self.action_space, self.config, existing_inputs=existing_inputs) - def extra_compute_action_fetches(self): - return {"vf_preds": self.value_function, "logits": self.logits} - - def extra_compute_grad_fetches(self): - return self.stats_fetches - - def update_kl(self, sampled_kl): - if sampled_kl > 2.0 * self.kl_target: - self.kl_coeff_val *= 1.5 - elif sampled_kl < 0.5 * self.kl_target: - self.kl_coeff_val *= 0.5 - self.kl_coeff.load(self.kl_coeff_val, session=self.sess) - return self.kl_coeff_val - - def value(self, ob, *args): - feed_dict = {self.observations: [ob], self.model.seq_lens: [1]} - assert len(args) == len(self.model.state_in), \ - (args, self.model.state_in) - for k, v in zip(self.model.state_in, args): - feed_dict[k] = v - vf = self.sess.run(self.value_function, feed_dict) - return vf[0] - - def postprocess_trajectory(self, sample_batch, other_agent_batches=None): + @override(PolicyGraph) + def postprocess_trajectory(self, + sample_batch, + other_agent_batches=None, + episode=None): completed = sample_batch["dones"][-1] if completed: last_r = 0.0 @@ -262,7 +278,7 @@ def postprocess_trajectory(self, sample_batch, other_agent_batches=None): next_state = [] for i in range(len(self.model.state_in)): next_state.append([sample_batch["state_out_{}".format(i)][-1]]) - last_r = self.value(sample_batch["new_obs"][-1], *next_state) + last_r = self._value(sample_batch["new_obs"][-1], *next_state) batch = compute_advantages( sample_batch, last_r, @@ -271,9 +287,36 @@ def postprocess_trajectory(self, sample_batch, other_agent_batches=None): use_gae=self.config["use_gae"]) return batch + @override(TFPolicyGraph) 
def gradients(self, optimizer): return optimizer.compute_gradients( self._loss, colocate_gradients_with_ops=True) + @override(PolicyGraph) def get_initial_state(self): return self.model.state_init + + @override(TFPolicyGraph) + def extra_compute_action_fetches(self): + return {"vf_preds": self.value_function, "logits": self.logits} + + @override(TFPolicyGraph) + def extra_compute_grad_fetches(self): + return self.stats_fetches + + def update_kl(self, sampled_kl): + if sampled_kl > 2.0 * self.kl_target: + self.kl_coeff_val *= 1.5 + elif sampled_kl < 0.5 * self.kl_target: + self.kl_coeff_val *= 0.5 + self.kl_coeff.load(self.kl_coeff_val, session=self.sess) + return self.kl_coeff_val + + def _value(self, ob, *args): + feed_dict = {self.observations: [ob], self.model.seq_lens: [1]} + assert len(args) == len(self.model.state_in), \ + (args, self.model.state_in) + for k, v in zip(self.model.state_in, args): + feed_dict[k] = v + vf = self.sess.run(self.value_function, feed_dict) + return vf[0] diff --git a/python/ray/rllib/env/__init__.py b/python/ray/rllib/env/__init__.py index 752d27cecf674..2e9ee49745d22 100644 --- a/python/ray/rllib/env/__init__.py +++ b/python/ray/rllib/env/__init__.py @@ -1,9 +1,11 @@ from ray.rllib.env.async_vector_env import AsyncVectorEnv from ray.rllib.env.multi_agent_env import MultiAgentEnv +from ray.rllib.env.external_env import ExternalEnv from ray.rllib.env.serving_env import ServingEnv from ray.rllib.env.vector_env import VectorEnv from ray.rllib.env.env_context import EnvContext __all__ = [ - "AsyncVectorEnv", "MultiAgentEnv", "ServingEnv", "VectorEnv", "EnvContext" + "AsyncVectorEnv", "MultiAgentEnv", "ExternalEnv", "VectorEnv", + "ServingEnv", "EnvContext" ] diff --git a/python/ray/rllib/env/async_vector_env.py b/python/ray/rllib/env/async_vector_env.py index c2e5ab1d30864..72cd812de1eae 100644 --- a/python/ray/rllib/env/async_vector_env.py +++ b/python/ray/rllib/env/async_vector_env.py @@ -2,9 +2,10 @@ from __future__ import division from __future__ import print_function -from ray.rllib.env.serving_env import ServingEnv +from ray.rllib.env.external_env import ExternalEnv from ray.rllib.env.vector_env import VectorEnv from ray.rllib.env.multi_agent_env import MultiAgentEnv +from ray.rllib.utils.annotations import override class AsyncVectorEnv(object): @@ -20,7 +21,13 @@ class AsyncVectorEnv(object): gym.Env => rllib.VectorEnv => rllib.AsyncVectorEnv rllib.MultiAgentEnv => rllib.AsyncVectorEnv - rllib.ServingEnv => rllib.AsyncVectorEnv + rllib.ExternalEnv => rllib.AsyncVectorEnv + + Attributes: + action_space (gym.Space): Action space. This must be defined for + single-agent envs. Multi-agent envs can set this to None. + observation_space (gym.Space): Observation space. This must be defined + for single-agent envs. Multi-agent envs can set this to None. 
Examples: >>> env = MyAsyncVectorEnv() @@ -64,11 +71,11 @@ def wrap_async(env, make_env=None, num_envs=1): if isinstance(env, MultiAgentEnv): env = _MultiAgentEnvToAsync( make_env=make_env, existing_envs=[env], num_envs=num_envs) - elif isinstance(env, ServingEnv): + elif isinstance(env, ExternalEnv): if num_envs != 1: raise ValueError( - "ServingEnv does not currently support num_envs > 1.") - env = _ServingEnvToAsync(env) + "ExternalEnv does not currently support num_envs > 1.") + env = _ExternalEnvToAsync(env) elif isinstance(env, VectorEnv): env = _VectorEnvToAsync(env) else: @@ -139,36 +146,52 @@ def _with_dummy_agent_id(env_id_to_values, dummy_id=_DUMMY_AGENT_ID): return {k: {dummy_id: v} for (k, v) in env_id_to_values.items()} -class _ServingEnvToAsync(AsyncVectorEnv): - """Internal adapter of ServingEnv to AsyncVectorEnv.""" +class _ExternalEnvToAsync(AsyncVectorEnv): + """Internal adapter of ExternalEnv to AsyncVectorEnv.""" - def __init__(self, serving_env): - self.serving_env = serving_env - serving_env.start() + def __init__(self, external_env, preprocessor=None): + self.external_env = external_env + self.prep = preprocessor + self.action_space = external_env.action_space + if preprocessor: + self.observation_space = preprocessor.observation_space + else: + self.observation_space = external_env.observation_space + external_env.start() + @override(AsyncVectorEnv) def poll(self): - with self.serving_env._results_avail_condition: + with self.external_env._results_avail_condition: results = self._poll() while len(results[0]) == 0: - self.serving_env._results_avail_condition.wait() + self.external_env._results_avail_condition.wait() results = self._poll() - if not self.serving_env.isAlive(): + if not self.external_env.isAlive(): raise Exception("Serving thread has stopped.") - limit = self.serving_env._max_concurrent_episodes + limit = self.external_env._max_concurrent_episodes assert len(results[0]) < limit, \ - ("Too many concurrent episodes, were some leaked? This ServingEnv " - "was created with max_concurrent={}".format(limit)) + ("Too many concurrent episodes, were some leaked? This " + "ExternalEnv was created with max_concurrent={}".format(limit)) return results + @override(AsyncVectorEnv) + def send_actions(self, action_dict): + for eid, action in action_dict.items(): + self.external_env._episodes[eid].action_queue.put( + action[_DUMMY_AGENT_ID]) + def _poll(self): all_obs, all_rewards, all_dones, all_infos = {}, {}, {}, {} off_policy_actions = {} - for eid, episode in self.serving_env._episodes.copy().items(): + for eid, episode in self.external_env._episodes.copy().items(): data = episode.get_data() if episode.cur_done: - del self.serving_env._episodes[eid] + del self.external_env._episodes[eid] if data: - all_obs[eid] = data["obs"] + if self.prep: + all_obs[eid] = self.prep.transform(data["obs"]) + else: + all_obs[eid] = data["obs"] all_rewards[eid] = data["reward"] all_dones[eid] = data["done"] all_infos[eid] = data["info"] @@ -180,11 +203,6 @@ def _poll(self): _with_dummy_agent_id(all_infos), \ _with_dummy_agent_id(off_policy_actions) - def send_actions(self, action_dict): - for eid, action in action_dict.items(): - self.serving_env._episodes[eid].action_queue.put( - action[_DUMMY_AGENT_ID]) - class _VectorEnvToAsync(AsyncVectorEnv): """Internal adapter of VectorEnv to AsyncVectorEnv. 
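All of these adapters end up presenting the same AsyncVectorEnv contract: poll() returns observations, rewards, dones, and infos as nested dicts keyed first by environment id and then by agent id (single-agent envs are wrapped under a dummy agent id, and dones carry the special "__all__" key), while send_actions() accepts actions keyed the same way. A toy stand-in showing the shape of that loop; FakeAsyncEnv is invented for illustration and is not an RLlib class:

class FakeAsyncEnv(object):
    """Single fake env/agent that ends its episode after three steps."""

    def __init__(self):
        self.t = 0

    def poll(self):
        obs = {0: {"agent0": [float(self.t)]}}
        rewards = {0: {"agent0": 1.0}}
        dones = {0: {"agent0": self.t >= 3, "__all__": self.t >= 3}}
        infos = {0: {"agent0": {}}}
        return obs, rewards, dones, infos, {}   # last dict: off-policy actions

    def send_actions(self, action_dict):
        assert set(action_dict[0].keys()) == {"agent0"}
        self.t += 1


env = FakeAsyncEnv()
while True:
    obs, rewards, dones, infos, off_policy = env.poll()
    if dones[0]["__all__"]:
        break
    env.send_actions({0: {"agent0": 0}})        # env_id -> agent_id -> action
print("episode finished after", env.t, "steps")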
@@ -196,13 +214,18 @@ class _VectorEnvToAsync(AsyncVectorEnv): def __init__(self, vector_env): self.vector_env = vector_env + self.action_space = vector_env.action_space + self.observation_space = vector_env.observation_space self.num_envs = vector_env.num_envs - self.new_obs = self.vector_env.vector_reset() + self.new_obs = None # lazily initialized self.cur_rewards = [None for _ in range(self.num_envs)] self.cur_dones = [False for _ in range(self.num_envs)] self.cur_infos = [None for _ in range(self.num_envs)] + @override(AsyncVectorEnv) def poll(self): + if self.new_obs is None: + self.new_obs = self.vector_env.vector_reset() new_obs = dict(enumerate(self.new_obs)) rewards = dict(enumerate(self.cur_rewards)) dones = dict(enumerate(self.cur_dones)) @@ -216,6 +239,7 @@ def poll(self): _with_dummy_agent_id(dones, "__all__"), \ _with_dummy_agent_id(infos), {} + @override(AsyncVectorEnv) def send_actions(self, action_dict): action_vector = [None] * self.num_envs for i in range(self.num_envs): @@ -223,9 +247,11 @@ def send_actions(self, action_dict): self.new_obs, self.cur_rewards, self.cur_dones, self.cur_infos = \ self.vector_env.vector_step(action_vector) + @override(AsyncVectorEnv) def try_reset(self, env_id): return {_DUMMY_AGENT_ID: self.vector_env.reset_at(env_id)} + @override(AsyncVectorEnv) def get_unwrapped(self): return self.vector_env.get_unwrapped() @@ -256,24 +282,39 @@ def __init__(self, make_env, existing_envs, num_envs): assert isinstance(env, MultiAgentEnv) self.env_states = [_MultiAgentEnvState(env) for env in self.envs] + @override(AsyncVectorEnv) def poll(self): obs, rewards, dones, infos = {}, {}, {}, {} for i, env_state in enumerate(self.env_states): obs[i], rewards[i], dones[i], infos[i] = env_state.poll() return obs, rewards, dones, infos, {} + @override(AsyncVectorEnv) def send_actions(self, action_dict): for env_id, agent_dict in action_dict.items(): if env_id in self.dones: raise ValueError("Env {} is already done".format(env_id)) env = self.envs[env_id] obs, rewards, dones, infos = env.step(agent_dict) + assert isinstance(obs, dict), "Not a multi-agent obs" + assert isinstance(rewards, dict), "Not a multi-agent reward" + assert isinstance(dones, dict), "Not a multi-agent return" + assert isinstance(infos, dict), "Not a multi-agent info" + if set(obs.keys()) != set(rewards.keys()): + raise ValueError( + "Key set for obs and rewards must be the same: " + "{} vs {}".format(obs.keys(), rewards.keys())) + if set(obs.keys()) != set(infos.keys()): + raise ValueError("Key set for obs and infos must be the same: " + "{} vs {}".format(obs.keys(), infos.keys())) if dones["__all__"]: self.dones.add(env_id) self.env_states[env_id].observe(obs, rewards, dones, infos) + @override(AsyncVectorEnv) def try_reset(self, env_id): obs = self.env_states[env_id].reset() + assert isinstance(obs, dict), "Not a multi-agent obs" if obs is not None and env_id in self.dones: self.dones.remove(env_id) return obs diff --git a/python/ray/rllib/env/external_env.py b/python/ray/rllib/env/external_env.py new file mode 100644 index 0000000000000..e71c816256dcc --- /dev/null +++ b/python/ray/rllib/env/external_env.py @@ -0,0 +1,226 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +from six.moves import queue +import threading +import uuid + + +class ExternalEnv(threading.Thread): + """An environment that interfaces with external agents. + + Unlike simulator envs, control is inverted. 
The environment queries the + policy to obtain actions and logs observations and rewards for training. + This is in contrast to gym.Env, where the algorithm drives the simulation + through env.step() calls. + + You can use ExternalEnv as the backend for policy serving (by serving HTTP + requests in the run loop), for ingesting offline logs data (by reading + offline transitions in the run loop), or other custom use cases not easily + expressed through gym.Env. + + ExternalEnv supports both on-policy actions (through self.get_action()), + and off-policy actions (through self.log_action()). + + This env is thread-safe, but individual episodes must be executed serially. + + Attributes: + action_space (gym.Space): Action space. + observation_space (gym.Space): Observation space. + + Examples: + >>> register_env("my_env", lambda config: YourExternalEnv(config)) + >>> agent = DQNAgent(env="my_env") + >>> while True: + print(agent.train()) + """ + + def __init__(self, action_space, observation_space, max_concurrent=100): + """Initialize an external env. + + ExternalEnv subclasses must call this during their __init__. + + Arguments: + action_space (gym.Space): Action space of the env. + observation_space (gym.Space): Observation space of the env. + max_concurrent (int): Max number of active episodes to allow at + once. Exceeding this limit raises an error. + """ + + threading.Thread.__init__(self) + self.daemon = True + self.action_space = action_space + self.observation_space = observation_space + self._episodes = {} + self._finished = set() + self._results_avail_condition = threading.Condition() + self._max_concurrent_episodes = max_concurrent + + def run(self): + """Override this to implement the run loop. + + Your loop should continuously: + 1. Call self.start_episode(episode_id) + 2. Call self.get_action(episode_id, obs) + -or- + self.log_action(episode_id, obs, action) + 3. Call self.log_returns(episode_id, reward) + 4. Call self.end_episode(episode_id, obs) + 5. Wait if nothing to do. + + Multiple episodes may be started at the same time. + """ + raise NotImplementedError + + def start_episode(self, episode_id=None, training_enabled=True): + """Record the start of an episode. + + Arguments: + episode_id (str): Unique string id for the episode or None for + it to be auto-assigned. + training_enabled (bool): Whether to use experiences for this + episode to improve the policy. + + Returns: + episode_id (str): Unique string id for the episode. + """ + + if episode_id is None: + episode_id = uuid.uuid4().hex + + if episode_id in self._finished: + raise ValueError( + "Episode {} has already completed.".format(episode_id)) + + if episode_id in self._episodes: + raise ValueError( + "Episode {} is already started".format(episode_id)) + + self._episodes[episode_id] = _ExternalEnvEpisode( + episode_id, self._results_avail_condition, training_enabled) + + return episode_id + + def get_action(self, episode_id, observation): + """Record an observation and get the on-policy action. + + Arguments: + episode_id (str): Episode id returned from start_episode(). + observation (obj): Current environment observation. + + Returns: + action (obj): Action from the env action space. + """ + + episode = self._get(episode_id) + return episode.wait_for_action(observation) + + def log_action(self, episode_id, observation, action): + """Record an observation and (off-policy) action taken. + + Arguments: + episode_id (str): Episode id returned from start_episode(). + observation (obj): Current environment observation. 
+ action (obj): Action for the observation. + """ + + episode = self._get(episode_id) + episode.log_action(observation, action) + + def log_returns(self, episode_id, reward, info=None): + """Record returns from the environment. + + The reward will be attributed to the previous action taken by the + episode. Rewards accumulate until the next action. If no reward is + logged before the next action, a reward of 0.0 is assumed. + + Arguments: + episode_id (str): Episode id returned from start_episode(). + reward (float): Reward from the environment. + info (dict): Optional info dict. + """ + + episode = self._get(episode_id) + episode.cur_reward += reward + if info: + episode.cur_info = info or {} + + def end_episode(self, episode_id, observation): + """Record the end of an episode. + + Arguments: + episode_id (str): Episode id returned from start_episode(). + observation (obj): Current environment observation. + """ + + episode = self._get(episode_id) + self._finished.add(episode.episode_id) + episode.done(observation) + + def _get(self, episode_id): + """Get a started episode or raise an error.""" + + if episode_id in self._finished: + raise ValueError( + "Episode {} has already completed.".format(episode_id)) + + if episode_id not in self._episodes: + raise ValueError("Episode {} not found.".format(episode_id)) + + return self._episodes[episode_id] + + +class _ExternalEnvEpisode(object): + """Tracked state for each active episode.""" + + def __init__(self, episode_id, results_avail_condition, training_enabled): + self.episode_id = episode_id + self.results_avail_condition = results_avail_condition + self.training_enabled = training_enabled + self.data_queue = queue.Queue() + self.action_queue = queue.Queue() + self.new_observation = None + self.new_action = None + self.cur_reward = 0.0 + self.cur_done = False + self.cur_info = {} + + def get_data(self): + if self.data_queue.empty(): + return None + return self.data_queue.get_nowait() + + def log_action(self, observation, action): + self.new_observation = observation + self.new_action = action + self._send() + self.action_queue.get(True, timeout=60.0) + + def wait_for_action(self, observation): + self.new_observation = observation + self._send() + return self.action_queue.get(True, timeout=60.0) + + def done(self, observation): + self.new_observation = observation + self.cur_done = True + self._send() + + def _send(self): + item = { + "obs": self.new_observation, + "reward": self.cur_reward, + "done": self.cur_done, + "info": self.cur_info, + } + if self.new_action is not None: + item["off_policy_action"] = self.new_action + if not self.training_enabled: + item["info"]["training_enabled"] = False + self.new_observation = None + self.new_action = None + self.cur_reward = 0.0 + with self.results_avail_condition: + self.data_queue.put_nowait(item) + self.results_avail_condition.notify() diff --git a/python/ray/rllib/env/multi_agent_env.py b/python/ray/rllib/env/multi_agent_env.py index 42f7cee8c0428..2e569230a2120 100644 --- a/python/ray/rllib/env/multi_agent_env.py +++ b/python/ray/rllib/env/multi_agent_env.py @@ -56,7 +56,7 @@ def step(self, action_dict): rewards (dict): Reward values for each ready agent. If the episode is just started, the value will be None. dones (dict): Done values for each ready agent. The special key - "__all__" is used to indicate env termination. + "__all__" (required) is used to indicate env termination. infos (dict): Info values for each ready agent. 
""" raise NotImplementedError diff --git a/python/ray/rllib/env/serving_env.py b/python/ray/rllib/env/serving_env.py index 0c1e3ec0dbfe4..cb976bf8041e9 100644 --- a/python/ray/rllib/env/serving_env.py +++ b/python/ray/rllib/env/serving_env.py @@ -2,219 +2,7 @@ from __future__ import division from __future__ import print_function -from six.moves import queue -import threading -import uuid +from ray.rllib.env.external_env import ExternalEnv - -class ServingEnv(threading.Thread): - """An environment that provides policy serving. - - Unlike simulator envs, control is inverted. The environment queries the - policy to obtain actions and logs observations and rewards for training. - This is in contrast to gym.Env, where the algorithm drives the simulation - through env.step() calls. - - You can use ServingEnv as the backend for policy serving (by serving HTTP - requests in the run loop), for ingesting offline logs data (by reading - offline transitions in the run loop), or other custom use cases not easily - expressed through gym.Env. - - ServingEnv supports both on-policy serving (through self.get_action()), and - off-policy serving (through self.log_action()). - - This env is thread-safe, but individual episodes must be executed serially. - - Examples: - >>> register_env("my_env", lambda config: YourServingEnv(config)) - >>> agent = DQNAgent(env="my_env") - >>> while True: - print(agent.train()) - """ - - def __init__(self, action_space, observation_space, max_concurrent=100): - """Initialize a serving env. - - ServingEnv subclasses must call this during their __init__. - - Arguments: - action_space (gym.Space): Action space of the env. - observation_space (gym.Space): Observation space of the env. - max_concurrent (int): Max number of active episodes to allow at - once. Exceeding this limit raises an error. - """ - - threading.Thread.__init__(self) - self.daemon = True - self.action_space = action_space - self.observation_space = observation_space - self._episodes = {} - self._finished = set() - self._results_avail_condition = threading.Condition() - self._max_concurrent_episodes = max_concurrent - - def run(self): - """Override this to implement the run loop. - - Your loop should continuously: - 1. Call self.start_episode() - 2. Call self.get_action() or self.log_action() - 3. Call self.log_returns() - 4. Call self.end_episode() - 5. Wait if nothing to do. - - Multiple episodes may be started at the same time. - """ - raise NotImplementedError - - def start_episode(self, episode_id=None, training_enabled=True): - """Record the start of an episode. - - Arguments: - episode_id (str): Unique string id for the episode or None for - it to be auto-assigned. - training_enabled (bool): Whether to use experiences for this - episode to improve the policy. - - Returns: - episode_id (str): Unique string id for the episode. - """ - - if episode_id is None: - episode_id = uuid.uuid4().hex - - if episode_id in self._finished: - raise ValueError( - "Episode {} has already completed.".format(episode_id)) - - if episode_id in self._episodes: - raise ValueError( - "Episode {} is already started".format(episode_id)) - - self._episodes[episode_id] = _ServingEnvEpisode( - episode_id, self._results_avail_condition, training_enabled) - - return episode_id - - def get_action(self, episode_id, observation): - """Record an observation and get the on-policy action. - - Arguments: - episode_id (str): Episode id returned from start_episode(). - observation (obj): Current environment observation. 
- - Returns: - action (obj): Action from the env action space. - """ - - episode = self._get(episode_id) - return episode.wait_for_action(observation) - - def log_action(self, episode_id, observation, action): - """Record an observation and (off-policy) action taken. - - Arguments: - episode_id (str): Episode id returned from start_episode(). - observation (obj): Current environment observation. - action (obj): Action for the observation. - """ - - episode = self._get(episode_id) - episode.log_action(observation, action) - - def log_returns(self, episode_id, reward, info=None): - """Record returns from the environment. - - The reward will be attributed to the previous action taken by the - episode. Rewards accumulate until the next action. If no reward is - logged before the next action, a reward of 0.0 is assumed. - - Arguments: - episode_id (str): Episode id returned from start_episode(). - reward (float): Reward from the environment. - info (dict): Optional info dict. - """ - - episode = self._get(episode_id) - episode.cur_reward += reward - if info: - episode.cur_info = info or {} - - def end_episode(self, episode_id, observation): - """Record the end of an episode. - - Arguments: - episode_id (str): Episode id returned from start_episode(). - observation (obj): Current environment observation. - """ - - episode = self._get(episode_id) - self._finished.add(episode.episode_id) - episode.done(observation) - - def _get(self, episode_id): - """Get a started episode or raise an error.""" - - if episode_id in self._finished: - raise ValueError( - "Episode {} has already completed.".format(episode_id)) - - if episode_id not in self._episodes: - raise ValueError("Episode {} not found.".format(episode_id)) - - return self._episodes[episode_id] - - -class _ServingEnvEpisode(object): - """Tracked state for each active episode.""" - - def __init__(self, episode_id, results_avail_condition, training_enabled): - self.episode_id = episode_id - self.results_avail_condition = results_avail_condition - self.training_enabled = training_enabled - self.data_queue = queue.Queue() - self.action_queue = queue.Queue() - self.new_observation = None - self.new_action = None - self.cur_reward = 0.0 - self.cur_done = False - self.cur_info = {} - - def get_data(self): - if self.data_queue.empty(): - return None - return self.data_queue.get_nowait() - - def log_action(self, observation, action): - self.new_observation = observation - self.new_action = action - self._send() - self.action_queue.get(True, timeout=60.0) - - def wait_for_action(self, observation): - self.new_observation = observation - self._send() - return self.action_queue.get(True, timeout=60.0) - - def done(self, observation): - self.new_observation = observation - self.cur_done = True - self._send() - - def _send(self): - item = { - "obs": self.new_observation, - "reward": self.cur_reward, - "done": self.cur_done, - "info": self.cur_info, - } - if self.new_action is not None: - item["off_policy_action"] = self.new_action - if not self.training_enabled: - item["info"]["training_enabled"] = False - self.new_observation = None - self.new_action = None - self.cur_reward = 0.0 - with self.results_avail_condition: - self.data_queue.put_nowait(item) - self.results_avail_condition.notify() +# renamed to ExternalEnv in 0.6 +ServingEnv = ExternalEnv diff --git a/python/ray/rllib/env/vector_env.py b/python/ray/rllib/env/vector_env.py index 7fb5b1605543e..c2eb1692061ce 100644 --- a/python/ray/rllib/env/vector_env.py +++ b/python/ray/rllib/env/vector_env.py @@ 
-2,6 +2,8 @@ from __future__ import division from __future__ import print_function +from ray.rllib.utils.annotations import override + class VectorEnv(object): """An environment that supports batch evaluation. @@ -69,13 +71,18 @@ def __init__(self, make_env, existing_envs, num_envs): self.num_envs = num_envs while len(self.envs) < self.num_envs: self.envs.append(self.make_env(len(self.envs))) + self.action_space = self.envs[0].action_space + self.observation_space = self.envs[0].observation_space + @override(VectorEnv) def vector_reset(self): return [e.reset() for e in self.envs] + @override(VectorEnv) def reset_at(self, index): return self.envs[index].reset() + @override(VectorEnv) def vector_step(self, actions): obs_batch, rew_batch, done_batch, info_batch = [], [], [], [] for i in range(self.num_envs): @@ -86,5 +93,6 @@ def vector_step(self, actions): info_batch.append(info) return obs_batch, rew_batch, done_batch, info_batch + @override(VectorEnv) def get_unwrapped(self): return self.envs diff --git a/python/ray/rllib/evaluation/episode.py b/python/ray/rllib/evaluation/episode.py index fc99d79fbb041..11977745184d5 100644 --- a/python/ray/rllib/evaluation/episode.py +++ b/python/ray/rllib/evaluation/episode.py @@ -7,13 +7,15 @@ import numpy as np +from ray.rllib.env.async_vector_env import _DUMMY_AGENT_ID + class MultiAgentEpisode(object): """Tracks the current state of a (possibly multi-agent) episode. The APIs in this class should be considered experimental, but we should avoid changing things for the sake of changing them since users may - depend on them for advanced algorithms. + depend on them for custom metrics or advanced algorithms. Attributes: new_batch_builder (func): Create a new MultiAgentSampleBatchBuilder. @@ -23,6 +25,8 @@ class MultiAgentEpisode(object): length (int): Length of this episode. episode_id (int): Unique id identifying this trajectory. agent_rewards (dict): Summed rewards broken down by agent. + custom_metrics (dict): Dict where the you can add custom metrics. + user_data (dict): Dict that you can use for temporary storage. Use case 1: Model-based rollouts in multi-agent: A custom compute_actions() function in a policy graph can inspect the @@ -47,15 +51,22 @@ def __init__(self, policies, policy_mapping_fn, batch_builder_factory, self.length = 0 self.episode_id = random.randrange(2e9) self.agent_rewards = defaultdict(float) + self.custom_metrics = {} + self.user_data = {} self._policies = policies self._policy_mapping_fn = policy_mapping_fn + self._next_agent_index = 0 + self._agent_to_index = {} self._agent_to_policy = {} self._agent_to_rnn_state = {} self._agent_to_last_obs = {} + self._agent_to_last_info = {} self._agent_to_last_action = {} self._agent_to_last_pi_info = {} + self._agent_to_prev_action = {} + self._agent_reward_history = defaultdict(list) - def policy_for(self, agent_id): + def policy_for(self, agent_id=_DUMMY_AGENT_ID): """Returns the policy graph for the specified agent. 
If the agent is new, the policy mapping fn will be called to bind the @@ -66,27 +77,46 @@ def policy_for(self, agent_id): self._agent_to_policy[agent_id] = self._policy_mapping_fn(agent_id) return self._agent_to_policy[agent_id] - def last_observation_for(self, agent_id): + def last_observation_for(self, agent_id=_DUMMY_AGENT_ID): """Returns the last observation for the specified agent.""" return self._agent_to_last_obs.get(agent_id) - def last_action_for(self, agent_id): - """Returns the last action for the specified agent.""" - - action = self._agent_to_last_action[agent_id] - # Concatenate tuple actions - if isinstance(action, list): - expanded = [] - for a in action: - if len(a.shape) == 1: - expanded.append(np.expand_dims(a, 1)) - else: - expanded.append(a) - action = np.concatenate(expanded, axis=1).flatten() - return action - - def rnn_state_for(self, agent_id): + def last_info_for(self, agent_id=_DUMMY_AGENT_ID): + """Returns the last info for the specified agent.""" + + return self._agent_to_last_info.get(agent_id) + + def last_action_for(self, agent_id=_DUMMY_AGENT_ID): + """Returns the last action for the specified agent, or zeros.""" + + if agent_id in self._agent_to_last_action: + return _flatten_action(self._agent_to_last_action[agent_id]) + else: + policy = self._policies[self.policy_for(agent_id)] + flat = _flatten_action(policy.action_space.sample()) + return np.zeros_like(flat) + + def prev_action_for(self, agent_id=_DUMMY_AGENT_ID): + """Returns the previous action for the specified agent.""" + + if agent_id in self._agent_to_prev_action: + return _flatten_action(self._agent_to_prev_action[agent_id]) + else: + # We're at t=0, so return all zeros. + return np.zeros_like(self.last_action_for(agent_id)) + + def prev_reward_for(self, agent_id=_DUMMY_AGENT_ID): + """Returns the previous reward for the specified agent.""" + + history = self._agent_reward_history[agent_id] + if len(history) >= 2: + return history[-2] + else: + # We're at t=0, so there is no previous reward, just return zero. 
+ return 0.0 + + def rnn_state_for(self, agent_id=_DUMMY_AGENT_ID): """Returns the last RNN state for the specified agent.""" if agent_id not in self._agent_to_rnn_state: @@ -94,7 +124,7 @@ def rnn_state_for(self, agent_id): self._agent_to_rnn_state[agent_id] = policy.get_initial_state() return self._agent_to_rnn_state[agent_id] - def last_pi_info_for(self, agent_id): + def last_pi_info_for(self, agent_id=_DUMMY_AGENT_ID): """Returns the last info object for the specified agent.""" return self._agent_to_last_pi_info[agent_id] @@ -105,6 +135,7 @@ def _add_agent_rewards(self, reward_dict): self.agent_rewards[agent_id, self.policy_for(agent_id)] += reward self.total_reward += reward + self._agent_reward_history[agent_id].append(reward) def _set_rnn_state(self, agent_id, rnn_state): self._agent_to_rnn_state[agent_id] = rnn_state @@ -112,8 +143,30 @@ def _set_rnn_state(self, agent_id, rnn_state): def _set_last_observation(self, agent_id, obs): self._agent_to_last_obs[agent_id] = obs + def _set_last_info(self, agent_id, info): + self._agent_to_last_info[agent_id] = info + def _set_last_action(self, agent_id, action): self._agent_to_last_action[agent_id] = action def _set_last_pi_info(self, agent_id, pi_info): self._agent_to_last_pi_info[agent_id] = pi_info + + def _agent_index(self, agent_id): + if agent_id not in self._agent_to_index: + self._agent_to_index[agent_id] = self._next_agent_index + self._next_agent_index += 1 + return self._agent_to_index[agent_id] + + +def _flatten_action(action): + # Concatenate tuple actions + if isinstance(action, list) or isinstance(action, tuple): + expanded = [] + for a in action: + if not hasattr(a, "shape") or len(a.shape) == 0: + expanded.append(np.expand_dims(a, 1)) + else: + expanded.append(a) + action = np.concatenate(expanded, axis=0).flatten() + return action diff --git a/python/ray/rllib/evaluation/metrics.py b/python/ray/rllib/evaluation/metrics.py index dc71c4ecd1185..92c357d117e85 100644 --- a/python/ray/rllib/evaluation/metrics.py +++ b/python/ray/rllib/evaluation/metrics.py @@ -2,48 +2,69 @@ from __future__ import division from __future__ import print_function +import logging import numpy as np import collections import ray from ray.rllib.evaluation.sample_batch import DEFAULT_POLICY_ID +logger = logging.getLogger(__name__) -def collect_metrics(local_evaluator, remote_evaluators=[]): + +def collect_metrics(local_evaluator, remote_evaluators=[], + timeout_seconds=180): """Gathers episode metrics from PolicyEvaluator instances.""" - episodes = collect_episodes(local_evaluator, remote_evaluators) - return summarize_episodes(episodes, episodes) + episodes, num_dropped = collect_episodes( + local_evaluator, remote_evaluators, timeout_seconds=timeout_seconds) + metrics = summarize_episodes(episodes, episodes, num_dropped) + return metrics -def collect_episodes(local_evaluator, remote_evaluators=[]): +def collect_episodes(local_evaluator, + remote_evaluators=[], + timeout_seconds=180): """Gathers new episodes metrics tuples from the given evaluators.""" - metric_lists = ray.get([ + pending = [ a.apply.remote(lambda ev: ev.sampler.get_metrics()) for a in remote_evaluators - ]) + ] + collected, _ = ray.wait( + pending, num_returns=len(pending), timeout=timeout_seconds * 1000) + num_metric_batches_dropped = len(pending) - len(collected) + + metric_lists = ray.get(collected) metric_lists.append(local_evaluator.sampler.get_metrics()) episodes = [] for metrics in metric_lists: episodes.extend(metrics) - return episodes + return episodes, 
num_metric_batches_dropped -def summarize_episodes(episodes, new_episodes): +def summarize_episodes(episodes, new_episodes, num_dropped): """Summarizes a set of episode metrics tuples. Arguments: episodes: smoothed set of episodes including historical ones new_episodes: just the new episodes in this iteration + num_dropped: number of workers haven't returned their metrics """ + if num_dropped > 0: + logger.warn("WARNING: {} workers have NOT returned metrics".format( + num_dropped)) + episode_rewards = [] episode_lengths = [] policy_rewards = collections.defaultdict(list) + custom_metrics = collections.defaultdict(list) for episode in episodes: episode_lengths.append(episode.episode_length) episode_rewards.append(episode.episode_reward) + for k, v in episode.custom_metrics.items(): + custom_metrics[k].append(v) for (_, policy_id), reward in episode.agent_rewards.items(): if policy_id != DEFAULT_POLICY_ID: policy_rewards[policy_id].append(reward) @@ -59,10 +80,23 @@ def summarize_episodes(episodes, new_episodes): for policy_id, rewards in policy_rewards.copy().items(): policy_rewards[policy_id] = np.mean(rewards) + for k, v_list in custom_metrics.copy().items(): + custom_metrics[k + "_mean"] = np.mean(v_list) + filt = [v for v in v_list if not np.isnan(v)] + if filt: + custom_metrics[k + "_min"] = np.min(filt) + custom_metrics[k + "_max"] = np.max(filt) + else: + custom_metrics[k + "_min"] = float("nan") + custom_metrics[k + "_max"] = float("nan") + del custom_metrics[k] + return dict( episode_reward_max=max_reward, episode_reward_min=min_reward, episode_reward_mean=avg_reward, episode_len_mean=avg_length, episodes_this_iter=len(new_episodes), - policy_reward_mean=dict(policy_rewards)) + policy_reward_mean=dict(policy_rewards), + custom_metrics=dict(custom_metrics), + num_metric_batches_dropped=num_dropped) diff --git a/python/ray/rllib/evaluation/policy_evaluator.py b/python/ray/rllib/evaluation/policy_evaluator.py index 24eb746100d56..b97f6a27bd00c 100644 --- a/python/ray/rllib/evaluation/policy_evaluator.py +++ b/python/ray/rllib/evaluation/policy_evaluator.py @@ -3,27 +3,31 @@ from __future__ import print_function import gym +import logging import pickle import tensorflow as tf import ray -from ray.rllib.models import ModelCatalog from ray.rllib.env.async_vector_env import AsyncVectorEnv from ray.rllib.env.atari_wrappers import wrap_deepmind, is_atari from ray.rllib.env.env_context import EnvContext -from ray.rllib.env.serving_env import ServingEnv -from ray.rllib.env.vector_env import VectorEnv from ray.rllib.env.multi_agent_env import MultiAgentEnv from ray.rllib.evaluation.interface import EvaluatorInterface from ray.rllib.evaluation.sample_batch import MultiAgentBatch, \ DEFAULT_POLICY_ID from ray.rllib.evaluation.sampler import AsyncSampler, SyncSampler -from ray.rllib.utils.compression import pack -from ray.rllib.utils.filter import get_filter from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph +from ray.rllib.models import ModelCatalog +from ray.rllib.models.preprocessors import NoPreprocessor +from ray.rllib.utils import merge_dicts +from ray.rllib.utils.annotations import override +from ray.rllib.utils.compression import pack +from ray.rllib.utils.filter import get_filter from ray.rllib.utils.tf_run_builder import TFRunBuilder +logger = logging.getLogger(__name__) + class PolicyEvaluator(EvaluatorInterface): """Common ``PolicyEvaluator`` implementation that wraps a ``PolicyGraph``. 
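The custom_metrics aggregation above pairs with the episode callbacks added elsewhere in this patch (on_episode_start/step/end and PolicyEvaluator's new `callbacks` argument). A minimal sketch of how user code might populate episode.custom_metrics so that summarize_episodes() reports pole_angle_mean/_min/_max; the CartPole observation layout (index 2 is the pole angle) and the per-episode averaging are assumptions, not part of the patch.

def on_episode_start(info):
    # info is {"env": async_vector_env, "episode": MultiAgentEpisode}
    info["episode"].user_data["pole_angles"] = []


def on_episode_step(info):
    episode = info["episode"]
    # last_observation_for() returns the preprocessed, filtered observation;
    # for CartPole with the default NoFilter this is the raw observation.
    episode.user_data["pole_angles"].append(
        abs(episode.last_observation_for()[2]))


def on_episode_end(info):
    episode = info["episode"]
    angles = episode.user_data["pole_angles"]
    # Surfaces in collect_metrics() output as pole_angle_mean/_min/_max.
    episode.custom_metrics["pole_angle"] = sum(angles) / max(len(angles), 1)


callbacks = {
    "on_episode_start": on_episode_start,
    "on_episode_step": on_episode_step,
    "on_episode_end": on_episode_end,
}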
@@ -71,7 +75,7 @@ class PolicyEvaluator(EvaluatorInterface): ... policy_mapping_fn=lambda agent_id: ... random.choice(["car_policy1", "car_policy2"]) ... if agent_id.startswith("car_") else "traffic_light_policy") - >>> print(evaluator.sample().keys()) + >>> print(evaluator.sample()) MultiAgentBatch({ "car_policy1": SampleBatch(...), "car_policy2": SampleBatch(...), @@ -79,8 +83,9 @@ class PolicyEvaluator(EvaluatorInterface): """ @classmethod - def as_remote(cls, num_cpus=None, num_gpus=None): - return ray.remote(num_cpus=num_cpus, num_gpus=num_gpus)(cls) + def as_remote(cls, num_cpus=None, num_gpus=None, resources=None): + return ray.remote( + num_cpus=num_cpus, num_gpus=num_gpus, resources=resources)(cls) def __init__(self, env_creator, @@ -97,11 +102,14 @@ def __init__(self, num_envs=1, observation_filter="NoFilter", clip_rewards=None, + clip_actions=True, env_config=None, model_config=None, policy_config=None, worker_index=0, - monitor_path=None): + monitor_path=None, + log_level=None, + callbacks=None): """Initialize a policy evaluator. Arguments: @@ -124,16 +132,14 @@ def __init__(self, in each sample batch returned from this evaluator. batch_mode (str): One of the following batch modes: "truncate_episodes": Each call to sample() will return a batch - of at most `batch_steps` in size. The batch will be exactly - `batch_steps` in size if postprocessing does not change - batch sizes. Episodes may be truncated in order to meet - this size requirement. When `num_envs > 1`, episodes will - be truncated to sequences of `batch_size / num_envs` in - length. + of at most `batch_steps * num_envs` in size. The batch will + be exactly `batch_steps * num_envs` in size if + postprocessing does not change batch sizes. Episodes may be + truncated in order to meet this size requirement. "complete_episodes": Each call to sample() will return a batch - of at least `batch_steps in size. Episodes will not be - truncated, but multiple episodes may be packed within one - batch to meet the batch size. Note that when + of at least `batch_steps * num_envs` in size. Episodes will + not be truncated, but multiple episodes may be packed + within one batch to meet the batch size. Note that when `num_envs > 1`, episode steps will be buffered until the episode completes, and hence batches may contain significant amounts of off-policy data. @@ -152,6 +158,8 @@ def __init__(self, clip_rewards (bool): Whether to clip rewards to [-1, 1] prior to experience postprocessing. Setting to None means clip for Atari only. + clip_actions (bool): Whether to clip action values to the range + specified by the policy action space. env_config (dict): Config to pass to the env creator. model_config (dict): Config to use when creating the policy model. policy_config (dict): Config to pass to the policy. In the @@ -162,48 +170,58 @@ def __init__(self, through EnvContext so that envs can be configured per worker. monitor_path (str): Write out episode stats and videos to this directory if specified. + log_level (str): Set the root log level on creation. + callbacks (dict): Dict of custom debug callbacks. 
""" + if log_level: + logging.getLogger("ray.rllib").setLevel(log_level) + env_context = EnvContext(env_config or {}, worker_index) policy_config = policy_config or {} self.policy_config = policy_config + self.callbacks = callbacks or {} model_config = model_config or {} policy_mapping_fn = (policy_mapping_fn or (lambda agent_id: DEFAULT_POLICY_ID)) + if not callable(policy_mapping_fn): + raise ValueError( + "Policy mapping function not callable. If you're using Tune, " + "make sure to escape the function with tune.function() " + "to prevent it from being evaluated as an expression.") self.env_creator = env_creator - self.batch_steps = batch_steps + self.sample_batch_size = batch_steps * num_envs self.batch_mode = batch_mode self.compress_observations = compress_observations + self.preprocessing_enabled = True self.env = env_creator(env_context) - if isinstance(self.env, VectorEnv) or \ - isinstance(self.env, ServingEnv) or \ - isinstance(self.env, MultiAgentEnv) or \ + if isinstance(self.env, MultiAgentEnv) or \ isinstance(self.env, AsyncVectorEnv): def wrap(env): return env # we can't auto-wrap these env types elif is_atari(self.env) and \ - "custom_preprocessor" not in model_config and \ + not model_config.get("custom_preprocessor") and \ preprocessor_pref == "deepmind": + # Deepmind wrappers already handle all preprocessing + self.preprocessing_enabled = False + if clip_rewards is None: clip_rewards = True def wrap(env): env = wrap_deepmind( env, - dim=model_config.get("dim", 84), - framestack=not model_config.get("use_lstm") - and not model_config.get("no_framestack")) + dim=model_config.get("dim"), + framestack=model_config.get("framestack")) if monitor_path: env = _monitor(env, monitor_path) return env else: def wrap(env): - env = ModelCatalog.get_preprocessor_as_wrapper( - env, model_config) if monitor_path: env = _monitor(env, monitor_path) return env @@ -226,13 +244,20 @@ def make_env(vector_index): config=tf.ConfigProto( gpu_options=tf.GPUOptions(allow_growth=True))) with self.tf_sess.as_default(): - self.policy_map = self._build_policy_map( - policy_dict, policy_config) + self.policy_map, self.preprocessors = \ + self._build_policy_map(policy_dict, policy_config) else: - self.policy_map = self._build_policy_map(policy_dict, - policy_config) + self.policy_map, self.preprocessors = self._build_policy_map( + policy_dict, policy_config) - self.multiagent = self.policy_map.keys() != {DEFAULT_POLICY_ID} + self.multiagent = set(self.policy_map.keys()) != {DEFAULT_POLICY_ID} + if self.multiagent: + if not (isinstance(self.env, MultiAgentEnv) + or isinstance(self.env, AsyncVectorEnv)): + raise ValueError( + "Have multiple policy graphs {}, but the env ".format( + self.policy_map) + + "{} is not a subclass of MultiAgentEnv?".format(self.env)) self.filters = { policy_id: get_filter(observation_filter, @@ -246,15 +271,10 @@ def make_env(vector_index): self.num_envs = num_envs if self.batch_mode == "truncate_episodes": - if batch_steps % num_envs != 0: - raise ValueError( - "In 'truncate_episodes' batch mode, `batch_steps` must be " - "evenly divisible by `num_envs`. 
Got {} and {}.".format( - batch_steps, num_envs)) - batch_steps = batch_steps // num_envs + unroll_length = batch_steps pack_episodes = True elif self.batch_mode == "complete_episodes": - batch_steps = float("inf") # never cut episodes + unroll_length = float("inf") # never cut episodes pack_episodes = False # sampler will return 1 episode per poll else: raise ValueError("Unsupported batch mode: {}".format( @@ -264,35 +284,35 @@ def make_env(vector_index): self.async_env, self.policy_map, policy_mapping_fn, + self.preprocessors, self.filters, clip_rewards, - batch_steps, + unroll_length, + self.callbacks, horizon=episode_horizon, pack=pack_episodes, - tf_sess=self.tf_sess) + tf_sess=self.tf_sess, + clip_actions=clip_actions) self.sampler.start() else: self.sampler = SyncSampler( self.async_env, self.policy_map, policy_mapping_fn, + self.preprocessors, self.filters, clip_rewards, - batch_steps, + unroll_length, + self.callbacks, horizon=episode_horizon, pack=pack_episodes, - tf_sess=self.tf_sess) + tf_sess=self.tf_sess, + clip_actions=clip_actions) - def _build_policy_map(self, policy_dict, policy_config): - policy_map = {} - for name, (cls, obs_space, act_space, - conf) in sorted(policy_dict.items()): - merged_conf = policy_config.copy() - merged_conf.update(conf) - with tf.variable_scope(name): - policy_map[name] = cls(obs_space, act_space, merged_conf) - return policy_map + logger.debug("Created evaluator with env {} ({}), policies {}".format( + self.async_env, self.env, self.policy_map)) + @override(EvaluatorInterface) def sample(self): """Evaluate the current policies and return a batch of experiences. @@ -310,13 +330,20 @@ def sample(self): else: max_batches = float("inf") - while steps_so_far < self.batch_steps and len(batches) < max_batches: + while steps_so_far < self.sample_batch_size and len( + batches) < max_batches: batch = self.sampler.get_data() steps_so_far += batch.count batches.append(batch) batches.extend(self.sampler.get_extra_batches()) batch = batches[0].concat_samples(batches) + if self.callbacks.get("on_sample_end"): + self.callbacks["on_sample_end"]({ + "evaluator": self, + "samples": batch + }) + if self.compress_observations: if isinstance(batch, MultiAgentBatch): for data in batch.policy_batches.values(): @@ -334,52 +361,7 @@ def sample_with_count(self): batch = self.sample() return batch, batch.count - def for_policy(self, func, policy_id=DEFAULT_POLICY_ID): - """Apply the given function to the specified policy graph.""" - - return func(self.policy_map[policy_id]) - - def foreach_policy(self, func): - """Apply the given function to each (policy, policy_id) tuple.""" - - return [func(policy, pid) for pid, policy in self.policy_map.items()] - - def foreach_trainable_policy(self, func): - """Apply the given function to each (policy, policy_id) tuple. - - This only applies func to policies in `self.policies_to_train`.""" - - return [ - func(policy, pid) for pid, policy in self.policy_map.items() - if pid in self.policies_to_train - ] - - def sync_filters(self, new_filters): - """Changes self's filter to given and rebases any accumulated delta. - - Args: - new_filters (dict): Filters with new state to update local copy. - """ - assert all(k in new_filters for k in self.filters) - for k in self.filters: - self.filters[k].sync(new_filters[k]) - - def get_filters(self, flush_after=False): - """Returns a snapshot of filters. - - Args: - flush_after (bool): Clears the filter buffer state. 
- - Returns: - return_filters (dict): Dict for serializable filters - """ - return_filters = {} - for k, f in self.filters.items(): - return_filters[k] = f.as_serializable() - if flush_after: - f.clear_buffer() - return return_filters - + @override(EvaluatorInterface) def get_weights(self, policies=None): if policies is None: policies = self.policy_map.keys() @@ -388,10 +370,12 @@ def get_weights(self, policies=None): for pid, policy in self.policy_map.items() if pid in policies } + @override(EvaluatorInterface) def set_weights(self, weights): for pid, w in weights.items(): self.policy_map[pid].set_weights(w) + @override(EvaluatorInterface) def compute_gradients(self, samples): if isinstance(samples, MultiAgentBatch): grad_out, info_out = {}, {} @@ -401,12 +385,14 @@ def compute_gradients(self, samples): if pid not in self.policies_to_train: continue grad_out[pid], info_out[pid] = ( - self.policy_map[pid].build_compute_gradients( + self.policy_map[pid]._build_compute_gradients( builder, batch)) grad_out = {k: builder.get(v) for k, v in grad_out.items()} info_out = {k: builder.get(v) for k, v in info_out.items()} else: for pid, batch in samples.policy_batches.items(): + if pid not in self.policies_to_train: + continue grad_out[pid], info_out[pid] = ( self.policy_map[pid].compute_gradients(batch)) else: @@ -415,12 +401,13 @@ def compute_gradients(self, samples): info_out["batch_count"] = samples.count return grad_out, info_out + @override(EvaluatorInterface) def apply_gradients(self, grads): if isinstance(grads, dict): if self.tf_sess is not None: builder = TFRunBuilder(self.tf_sess, "apply_gradients") outputs = { - pid: self.policy_map[pid].build_apply_gradients( + pid: self.policy_map[pid]._build_apply_gradients( builder, grad) for pid, grad in grads.items() } @@ -433,6 +420,7 @@ def apply_gradients(self, grads): else: return self.policy_map[DEFAULT_POLICY_ID].apply_gradients(grads) + @override(EvaluatorInterface) def compute_apply(self, samples): if isinstance(samples, MultiAgentBatch): info_out = {} @@ -442,11 +430,13 @@ def compute_apply(self, samples): if pid not in self.policies_to_train: continue info_out[pid], _ = ( - self.policy_map[pid].build_compute_apply( + self.policy_map[pid]._build_compute_apply( builder, batch)) info_out = {k: builder.get(v) for k, v in info_out.items()} else: for pid, batch in samples.policy_batches.items(): + if pid not in self.policies_to_train: + continue info_out[pid], _ = ( self.policy_map[pid].compute_apply(batch)) return info_out @@ -455,6 +445,52 @@ def compute_apply(self, samples): self.policy_map[DEFAULT_POLICY_ID].compute_apply(samples)) return grad_fetch + def for_policy(self, func, policy_id=DEFAULT_POLICY_ID): + """Apply the given function to the specified policy graph.""" + + return func(self.policy_map[policy_id]) + + def foreach_policy(self, func): + """Apply the given function to each (policy, policy_id) tuple.""" + + return [func(policy, pid) for pid, policy in self.policy_map.items()] + + def foreach_trainable_policy(self, func): + """Apply the given function to each (policy, policy_id) tuple. + + This only applies func to policies in `self.policies_to_train`.""" + + return [ + func(policy, pid) for pid, policy in self.policy_map.items() + if pid in self.policies_to_train + ] + + def sync_filters(self, new_filters): + """Changes self's filter to given and rebases any accumulated delta. + + Args: + new_filters (dict): Filters with new state to update local copy. 
+ """ + assert all(k in new_filters for k in self.filters) + for k in self.filters: + self.filters[k].sync(new_filters[k]) + + def get_filters(self, flush_after=False): + """Returns a snapshot of filters. + + Args: + flush_after (bool): Clears the filter buffer state. + + Returns: + return_filters (dict): Dict for serializable filters + """ + return_filters = {} + for k, f in self.filters.items(): + return_filters[k] = f.as_serializable() + if flush_after: + f.clear_buffer() + return return_filters + def save(self): filters = self.get_filters(flush_after=True) state = { @@ -472,6 +508,29 @@ def restore(self, objs): def set_global_vars(self, global_vars): self.foreach_policy(lambda p, _: p.on_global_var_update(global_vars)) + def _build_policy_map(self, policy_dict, policy_config): + policy_map = {} + preprocessors = {} + for name, (cls, obs_space, act_space, + conf) in sorted(policy_dict.items()): + merged_conf = merge_dicts(policy_config, conf) + if self.preprocessing_enabled: + preprocessor = ModelCatalog.get_preprocessor_for_space( + obs_space, merged_conf.get("model")) + preprocessors[name] = preprocessor + obs_space = preprocessor.observation_space + else: + preprocessors[name] = NoPreprocessor(obs_space) + if isinstance(obs_space, gym.spaces.Dict) or \ + isinstance(obs_space, gym.spaces.Tuple): + raise ValueError( + "Found raw Tuple|Dict space as input to policy graph. " + "Please preprocess these observations with a " + "Tuple|DictFlatteningPreprocessor.") + with tf.variable_scope(name): + policy_map[name] = cls(obs_space, act_space, merged_conf) + return policy_map, preprocessors + def _validate_and_canonicalize(policy_graph, env): if isinstance(policy_graph, dict): @@ -503,6 +562,11 @@ def _validate_and_canonicalize(policy_graph, env): elif not issubclass(policy_graph, PolicyGraph): raise ValueError("policy_graph must be a rllib.PolicyGraph class") else: + if (isinstance(env, MultiAgentEnv) + and not hasattr(env, "observation_space")): + raise ValueError( + "MultiAgentEnv must have observation_space defined if run " + "in a single-agent configuration.") return { DEFAULT_POLICY_ID: (policy_graph, env.observation_space, env.action_space, {}) diff --git a/python/ray/rllib/evaluation/policy_graph.py b/python/ray/rllib/evaluation/policy_graph.py index 925fa70aa1545..c19da286b0b9a 100644 --- a/python/ray/rllib/evaluation/policy_graph.py +++ b/python/ray/rllib/evaluation/policy_graph.py @@ -40,14 +40,16 @@ class you pass into PolicyEvaluator will be constructed with def compute_actions(self, obs_batch, state_batches, - is_training=False, + prev_action_batch=None, + prev_reward_batch=None, episodes=None): """Compute actions for the current policy. Arguments: obs_batch (np.ndarray): batch of observations state_batches (list): list of RNN state input batches, if any - is_training (bool): whether we are training the policy + prev_action_batch (np.ndarray): batch of previous action values + prev_reward_batch (np.ndarray): batch of previous rewards episodes (list): MultiAgentEpisode for each obs in obs_batch. This provides access to all of the internal episode state, which may be useful for model-based or multiagent algorithms. @@ -65,17 +67,19 @@ def compute_actions(self, def compute_single_action(self, obs, state, - is_training=False, + prev_action_batch=None, + prev_reward_batch=None, episode=None): """Unbatched version of compute_actions. 
Arguments: obs (obj): single observation state_batches (list): list of RNN state inputs, if any - is_training (bool): whether we are training the policy + prev_action_batch (np.ndarray): batch of previous action values + prev_reward_batch (np.ndarray): batch of previous rewards episode (MultiAgentEpisode): this provides access to all of the internal episode state, which may be useful for model-based or - multiagent algorithms. + multi-agent algorithms. Returns: actions (obj): single action @@ -84,11 +88,14 @@ def compute_single_action(self, """ [action], state_out, info = self.compute_actions( - [obs], [[s] for s in state], is_training, episodes=[episode]) + [obs], [[s] for s in state], episodes=[episode]) return action, [s[0] for s in state_out], \ {k: v[0] for k, v in info.items()} - def postprocess_trajectory(self, sample_batch, other_agent_batches=None): + def postprocess_trajectory(self, + sample_batch, + other_agent_batches=None, + episode=None): """Implements algorithm-specific trajectory postprocessing. This will be called on each trajectory fragment computed during policy @@ -100,6 +107,9 @@ def postprocess_trajectory(self, sample_batch, other_agent_batches=None): other_agent_batches (dict): In a multi-agent env, this contains a mapping of agent ids to (policy_graph, agent_batch) tuples containing the policy graph and experiences of the other agent. + episode (MultiAgentEpisode): this provides access to all of the + internal episode state, which may be useful for model-based or + multi-agent algorithms. Returns: SampleBatch: postprocessed sample batch. diff --git a/python/ray/rllib/evaluation/sample_batch.py b/python/ray/rllib/evaluation/sample_batch.py index f8f88a4aae314..5a0099530705f 100644 --- a/python/ray/rllib/evaluation/sample_batch.py +++ b/python/ray/rllib/evaluation/sample_batch.py @@ -79,6 +79,11 @@ def __init__(self, policy_map, clip_rewards): self.agent_to_policy = {} self.count = 0 # increment this manually + def total(self): + """Returns summed number of steps across all agent buffers.""" + + return sum(p.count for p in self.policy_builders.values()) + def has_pending_data(self): """Returns whether there is pending unprocessed data.""" @@ -99,11 +104,14 @@ def add_values(self, agent_id, policy_id, **values): builder = self.agent_builders[agent_id] builder.add_values(**values) - def postprocess_batch_so_far(self): + def postprocess_batch_so_far(self, episode): """Apply policy postprocessors to any unprocessed rows. This pushes the postprocessed per-agent batches onto the per-policy builders, clearing per-agent state. + + Arguments: + episode: current MultiAgentEpisode object or None """ # Materialize the batches so far @@ -128,7 +136,7 @@ def postprocess_batch_so_far(self): "Batches sent to postprocessing must only contain steps " "from a single trajectory.", pre_batch) post_batches[agent_id] = policy.postprocess_trajectory( - pre_batch, other_batches) + pre_batch, other_batches, episode) # Append into policy batches and reset for agent_id, post_batch in sorted(post_batches.items()): @@ -137,14 +145,17 @@ def postprocess_batch_so_far(self): self.agent_builders.clear() self.agent_to_policy.clear() - def build_and_reset(self): + def build_and_reset(self, episode): """Returns the accumulated sample batches for each policy. Any unprocessed rows will be first postprocessed with a policy postprocessor. The internal state of this builder will be reset. 
+ + Arguments: + episode: current MultiAgentEpisode object or None """ - self.postprocess_batch_so_far() + self.postprocess_batch_so_far(episode) policy_batches = {} for policy_id, builder in self.policy_builders.items(): if builder.count > 0: @@ -189,6 +200,11 @@ def concat_samples(samples): out[policy_id] = SampleBatch.concat_samples(batches) return MultiAgentBatch(out, total_count) + def copy(self): + return MultiAgentBatch( + {k: v.copy() + for (k, v) in self.policy_batches.items()}, self.count) + def total(self): ct = 0 for batch in self.policy_batches.values(): @@ -250,6 +266,11 @@ def concat(self, other): out[k] = np.concatenate([self[k], other[k]]) return SampleBatch(out) + def copy(self): + return SampleBatch( + {k: np.array(v, copy=True) + for (k, v) in self.data.items()}) + def rows(self): """Returns an iterator over data rows, i.e. dicts with column values. diff --git a/python/ray/rllib/evaluation/sampler.py b/python/ray/rllib/evaluation/sampler.py index f41c3ca739e21..ac7c6ed8a7ea8 100644 --- a/python/ray/rllib/evaluation/sampler.py +++ b/python/ray/rllib/evaluation/sampler.py @@ -2,23 +2,32 @@ from __future__ import division from __future__ import print_function +import gym from collections import defaultdict, namedtuple +import logging +import numpy as np import six.moves.queue as queue import threading -from ray.rllib.evaluation.episode import MultiAgentEpisode +from ray.rllib.evaluation.episode import MultiAgentEpisode, _flatten_action from ray.rllib.evaluation.sample_batch import MultiAgentSampleBatchBuilder, \ MultiAgentBatch from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph from ray.rllib.env.async_vector_env import AsyncVectorEnv from ray.rllib.env.atari_wrappers import get_wrapper_by_cls, MonitorEnv +from ray.rllib.models.action_dist import TupleActions from ray.rllib.utils.tf_run_builder import TFRunBuilder +logger = logging.getLogger(__name__) +_large_batch_warned = False + RolloutMetrics = namedtuple( - "RolloutMetrics", ["episode_length", "episode_reward", "agent_rewards"]) + "RolloutMetrics", + ["episode_length", "episode_reward", "agent_rewards", "custom_metrics"]) -PolicyEvalData = namedtuple("PolicyEvalData", - ["env_id", "agent_id", "obs", "rnn_state"]) +PolicyEvalData = namedtuple( + "PolicyEvalData", + ["env_id", "agent_id", "obs", "rnn_state", "prev_action", "prev_reward"]) class SyncSampler(object): @@ -34,23 +43,28 @@ def __init__(self, env, policies, policy_mapping_fn, + preprocessors, obs_filters, clip_rewards, - num_local_steps, + unroll_length, + callbacks, horizon=None, pack=False, - tf_sess=None): + tf_sess=None, + clip_actions=True): self.async_vector_env = AsyncVectorEnv.wrap_async(env) - self.num_local_steps = num_local_steps + self.unroll_length = unroll_length self.horizon = horizon self.policies = policies self.policy_mapping_fn = policy_mapping_fn - self._obs_filters = obs_filters + self.preprocessors = preprocessors + self.obs_filters = obs_filters self.extra_batches = queue.Queue() self.rollout_provider = _env_runner( self.async_vector_env, self.extra_batches.put, self.policies, - self.policy_mapping_fn, self.num_local_steps, self.horizon, - self._obs_filters, clip_rewards, pack, tf_sess) + self.policy_mapping_fn, self.unroll_length, self.horizon, + self.preprocessors, self.obs_filters, clip_rewards, clip_actions, + pack, callbacks, tf_sess) self.metrics_queue = queue.Queue() def get_data(self): @@ -90,12 +104,15 @@ def __init__(self, env, policies, policy_mapping_fn, + preprocessors, obs_filters, clip_rewards, - 
num_local_steps, + unroll_length, + callbacks, horizon=None, pack=False, - tf_sess=None): + tf_sess=None, + clip_actions=True): for _, f in obs_filters.items(): assert getattr(f, "is_concurrent", False), \ "Observation Filter must support concurrent updates." @@ -104,15 +121,18 @@ def __init__(self, self.queue = queue.Queue(5) self.extra_batches = queue.Queue() self.metrics_queue = queue.Queue() - self.num_local_steps = num_local_steps + self.unroll_length = unroll_length self.horizon = horizon self.policies = policies self.policy_mapping_fn = policy_mapping_fn - self._obs_filters = obs_filters + self.preprocessors = preprocessors + self.obs_filters = obs_filters self.clip_rewards = clip_rewards self.daemon = True self.pack = pack self.tf_sess = tf_sess + self.callbacks = callbacks + self.clip_actions = clip_actions def run(self): try: @@ -124,8 +144,9 @@ def run(self): def _run(self): rollout_provider = _env_runner( self.async_vector_env, self.extra_batches.put, self.policies, - self.policy_mapping_fn, self.num_local_steps, self.horizon, - self._obs_filters, self.clip_rewards, self.pack, self.tf_sess) + self.policy_mapping_fn, self.unroll_length, self.horizon, + self.preprocessors, self.obs_filters, self.clip_rewards, + self.clip_actions, self.pack, self.callbacks, self.tf_sess) while True: # The timeout variable exists because apparently, if one worker # dies, the other workers won't die with it, unless the timeout is @@ -182,11 +203,14 @@ def _env_runner(async_vector_env, extra_batch_callback, policies, policy_mapping_fn, - num_local_steps, + unroll_length, horizon, + preprocessors, obs_filters, clip_rewards, + clip_actions, pack, + callbacks, tf_sess=None): """This implements the common experience collection logic. @@ -197,14 +221,18 @@ def _env_runner(async_vector_env, policy_mapping_fn (func): Function that maps agent ids to policy ids. This is called when an agent first enters the environment. The agent is then "bound" to the returned policy for the episode. - num_local_steps (int): Number of episode steps before `SampleBatch` is + unroll_length (int): Number of episode steps before `SampleBatch` is yielded. Set to infinity to yield complete episodes. horizon (int): Horizon of the episode. + preprocessors (dict): Map of policy id to preprocessor for the + observations prior to filtering. obs_filters (dict): Map of policy id to filter used to process observations for the policy. clip_rewards (bool): Whether to clip rewards before postprocessing. pack (bool): Whether to pack multiple episodes into each batch. This - guarantees batches will be exactly `num_local_steps` in size. + guarantees batches will be exactly `unroll_length` in size. + clip_actions (bool): Whether to clip actions to the space range. + callbacks (dict): User callbacks to run on episode events. tf_sess (Session|None): Optional tensorflow session to use for batching TF policy evaluations. 
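PolicyEvalData now carries prev_action and prev_reward, and _do_policy_eval (further below) forwards them to compute_actions() as prev_action_batch / prev_reward_batch. A minimal sketch of a policy graph written against the updated policy_graph.py signature; the random action choice and no-op weight methods are placeholders, and the constructor simply mirrors how _build_policy_map instantiates graphs with (obs_space, act_space, config).

from ray.rllib.evaluation.policy_graph import PolicyGraph


class RandomPolicyGraph(PolicyGraph):
    """Illustrative only: ignores observations and samples random actions."""

    def __init__(self, observation_space, action_space, config):
        PolicyGraph.__init__(self, observation_space, action_space, config)
        # Stored explicitly so compute_actions below does not depend on
        # base-class attribute handling.
        self.action_space = action_space

    def compute_actions(self,
                        obs_batch,
                        state_batches,
                        prev_action_batch=None,
                        prev_reward_batch=None,
                        episodes=None):
        # prev_action_batch / prev_reward_batch are zero-filled at t=0 by
        # _process_observations, so they are always safe to consume.
        actions = [self.action_space.sample() for _ in obs_batch]
        return actions, [], {}

    def get_weights(self):
        return {}

    def set_weights(self, weights):
        pass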
@@ -218,7 +246,7 @@ def _env_runner(async_vector_env, horizon = ( async_vector_env.get_unwrapped()[0].spec.max_episode_steps) except Exception: - print("Warning, no horizon specified, assuming infinite") + logger.warn("no episode horizon specified, assuming inf") if not horizon: horizon = float("inf") @@ -233,8 +261,14 @@ def get_batch_builder(): return MultiAgentSampleBatchBuilder(policies, clip_rewards) def new_episode(): - return MultiAgentEpisode(policies, policy_mapping_fn, - get_batch_builder, extra_batch_callback) + episode = MultiAgentEpisode(policies, policy_mapping_fn, + get_batch_builder, extra_batch_callback) + if callbacks.get("on_episode_start"): + callbacks["on_episode_start"]({ + "env": async_vector_env, + "episode": episode + }) + return episode active_episodes = defaultdict(new_episode) @@ -243,152 +277,267 @@ def new_episode(): unfiltered_obs, rewards, dones, infos, off_policy_actions = \ async_vector_env.poll() - # Map of policy_id to list of PolicyEvalData - to_eval = defaultdict(list) + # Process observations and prepare for policy evaluation + active_envs, to_eval, outputs = _process_observations( + async_vector_env, policies, batch_builder_pool, active_episodes, + unfiltered_obs, rewards, dones, infos, off_policy_actions, horizon, + preprocessors, obs_filters, unroll_length, pack, callbacks) + for o in outputs: + yield o - # Map of env_id -> agent_id -> action replies - actions_to_send = defaultdict(dict) + # Do batched policy eval + eval_results = _do_policy_eval(tf_sess, to_eval, policies, + active_episodes, clip_actions) - # For each environment - for env_id, agent_obs in unfiltered_obs.items(): - new_episode = env_id not in active_episodes - episode = active_episodes[env_id] - if not new_episode: - episode.length += 1 - episode.batch_builder.count += 1 - episode._add_agent_rewards(rewards[env_id]) - - # Check episode termination conditions - if dones[env_id]["__all__"] or episode.length >= horizon: - all_done = True - atari_metrics = _fetch_atari_metrics(async_vector_env) - if atari_metrics is not None: - for m in atari_metrics: - yield m - else: - yield RolloutMetrics(episode.length, episode.total_reward, - dict(episode.agent_rewards)) + # Process results and update episode state + actions_to_send = _process_policy_eval_results( + to_eval, eval_results, active_episodes, active_envs, + off_policy_actions) + + # Return computed actions to ready envs. We also send to envs that have + # taken off-policy actions; those envs are free to ignore the action. + async_vector_env.send_actions(actions_to_send) + + +def _process_observations(async_vector_env, policies, batch_builder_pool, + active_episodes, unfiltered_obs, rewards, dones, + infos, off_policy_actions, horizon, preprocessors, + obs_filters, unroll_length, pack, callbacks): + """Record new data from the environment and prepare for policy evaluation. 
+ + Returns: + active_envs: set of non-terminated env ids + to_eval: map of policy_id to list of agent PolicyEvalData + outputs: list of metrics and samples to return from the sampler + """ + + active_envs = set() + to_eval = defaultdict(list) + outputs = [] + + # For each environment + for env_id, agent_obs in unfiltered_obs.items(): + new_episode = env_id not in active_episodes + episode = active_episodes[env_id] + if not new_episode: + episode.length += 1 + episode.batch_builder.count += 1 + episode._add_agent_rewards(rewards[env_id]) + + global _large_batch_warned + if (not _large_batch_warned and + episode.batch_builder.total() > max(1000, unroll_length * 10)): + _large_batch_warned = True + logger.warn( + "More than {} observations for {} env steps ".format( + episode.batch_builder.total(), + episode.batch_builder.count) + "are buffered in " + "the sampler. If this is not intentional, check that the " + "the `horizon` config is set correctly, or consider setting " + "`batch_mode` to 'truncate_episodes'. Note that in " + "multi-agent environments, `sample_batch_size` sets the " + "batch size based on environment steps, not the steps of " + "individual agents.") + + # Check episode termination conditions + if dones[env_id]["__all__"] or episode.length >= horizon: + all_done = True + atari_metrics = _fetch_atari_metrics(async_vector_env) + if atari_metrics is not None: + for m in atari_metrics: + outputs.append( + m._replace(custom_metrics=episode.custom_metrics)) + else: + outputs.append( + RolloutMetrics(episode.length, episode.total_reward, + dict(episode.agent_rewards), + episode.custom_metrics)) + else: + all_done = False + active_envs.add(env_id) + + # For each agent in the environment + for agent_id, raw_obs in agent_obs.items(): + policy_id = episode.policy_for(agent_id) + prep_obs = _get_or_raise(preprocessors, + policy_id).transform(raw_obs) + filtered_obs = _get_or_raise(obs_filters, policy_id)(prep_obs) + agent_done = bool(all_done or dones[env_id].get(agent_id)) + if not agent_done: + to_eval[policy_id].append( + PolicyEvalData(env_id, agent_id, filtered_obs, + episode.rnn_state_for(agent_id), + episode.last_action_for(agent_id), + rewards[env_id][agent_id] or 0.0)) + + last_observation = episode.last_observation_for(agent_id) + episode._set_last_observation(agent_id, filtered_obs) + episode._set_last_info(agent_id, infos[env_id][agent_id]) + + # Record transition info if applicable + if last_observation is not None and \ + infos[env_id][agent_id].get("training_enabled", True): + episode.batch_builder.add_values( + agent_id, + policy_id, + t=episode.length - 1, + eps_id=episode.episode_id, + agent_index=episode._agent_index(agent_id), + obs=last_observation, + actions=episode.last_action_for(agent_id), + rewards=rewards[env_id][agent_id], + prev_actions=episode.prev_action_for(agent_id), + prev_rewards=episode.prev_reward_for(agent_id), + dones=agent_done, + infos=infos[env_id][agent_id], + new_obs=filtered_obs, + **episode.last_pi_info_for(agent_id)) + + # Invoke the step callback after the step is logged to the episode + if callbacks.get("on_episode_step"): + callbacks["on_episode_step"]({ + "env": async_vector_env, + "episode": episode + }) + + # Cut the batch if we're not packing multiple episodes into one, + # or if we've exceeded the requested batch size. 
+ if episode.batch_builder.has_pending_data(): + if (all_done and not pack) or \ + episode.batch_builder.count >= unroll_length: + outputs.append(episode.batch_builder.build_and_reset(episode)) + elif all_done: + # Make sure postprocessor stays within one episode + episode.batch_builder.postprocess_batch_so_far(episode) + + if all_done: + # Handle episode termination + batch_builder_pool.append(episode.batch_builder) + if callbacks.get("on_episode_end"): + callbacks["on_episode_end"]({ + "env": async_vector_env, + "episode": episode + }) + del active_episodes[env_id] + resetted_obs = async_vector_env.try_reset(env_id) + if resetted_obs is None: + # Reset not supported, drop this env from the ready list + if horizon != float("inf"): + raise ValueError( + "Setting episode horizon requires reset() support " + "from the environment.") else: - all_done = False - # At least send an empty dict if not done - actions_to_send[env_id] = {} - - # For each agent in the environment - for agent_id, raw_obs in agent_obs.items(): - policy_id = episode.policy_for(agent_id) - filtered_obs = _get_or_raise(obs_filters, policy_id)(raw_obs) - agent_done = bool(all_done or dones[env_id].get(agent_id)) - if not agent_done: + # Creates a new episode + episode = active_episodes[env_id] + for agent_id, raw_obs in resetted_obs.items(): + policy_id = episode.policy_for(agent_id) + policy = _get_or_raise(policies, policy_id) + prep_obs = _get_or_raise(preprocessors, + policy_id).transform(raw_obs) + filtered_obs = _get_or_raise(obs_filters, + policy_id)(prep_obs) + episode._set_last_observation(agent_id, filtered_obs) to_eval[policy_id].append( - PolicyEvalData(env_id, agent_id, filtered_obs, - episode.rnn_state_for(agent_id))) - - last_observation = episode.last_observation_for(agent_id) - episode._set_last_observation(agent_id, filtered_obs) - - # Record transition info if applicable - if last_observation is not None and \ - infos[env_id][agent_id].get("training_enabled", True): - episode.batch_builder.add_values( - agent_id, - policy_id, - t=episode.length - 1, - eps_id=episode.episode_id, - obs=last_observation, - actions=episode.last_action_for(agent_id), - rewards=rewards[env_id][agent_id], - dones=agent_done, - infos=infos[env_id][agent_id], - new_obs=filtered_obs, - **episode.last_pi_info_for(agent_id)) - - # Cut the batch if we're not packing multiple episodes into one, - # or if we've exceeded the requested batch size. - if episode.batch_builder.has_pending_data(): - if (all_done and not pack) or \ - episode.batch_builder.count >= num_local_steps: - yield episode.batch_builder.build_and_reset() - elif all_done: - # Make sure postprocessor stays within one episode - episode.batch_builder.postprocess_batch_so_far() - - if all_done: - # Handle episode termination - batch_builder_pool.append(episode.batch_builder) - del active_episodes[env_id] - resetted_obs = async_vector_env.try_reset(env_id) - if resetted_obs is None: - # Reset not supported, drop this env from the ready list - assert horizon == float("inf"), \ - "Setting episode horizon requires reset() support." 
- else: - # Creates a new episode - episode = active_episodes[env_id] - for agent_id, raw_obs in resetted_obs.items(): - policy_id = episode.policy_for(agent_id) - filtered_obs = _get_or_raise(obs_filters, - policy_id)(raw_obs) - episode._set_last_observation(agent_id, filtered_obs) - to_eval[policy_id].append( - PolicyEvalData(env_id, agent_id, filtered_obs, - episode.rnn_state_for(agent_id))) - - # Batch eval policy actions if possible - if tf_sess: - builder = TFRunBuilder(tf_sess, "policy_eval") - pending_fetches = {} + PolicyEvalData( + env_id, agent_id, filtered_obs, + episode.rnn_state_for(agent_id), + np.zeros_like( + _flatten_action(policy.action_space.sample())), + 0.0)) + + return active_envs, to_eval, outputs + + +def _do_policy_eval(tf_sess, to_eval, policies, active_episodes, clip_actions): + """Call compute actions on observation batches to get next actions. + + Returns: + eval_results: dict of policy to compute_action() outputs. + """ + + eval_results = {} + + if tf_sess: + builder = TFRunBuilder(tf_sess, "policy_eval") + pending_fetches = {} + else: + builder = None + for policy_id, eval_data in to_eval.items(): + rnn_in_cols = _to_column_format([t.rnn_state for t in eval_data]) + policy = _get_or_raise(policies, policy_id) + if builder and (policy.compute_actions.__code__ is + TFPolicyGraph.compute_actions.__code__): + pending_fetches[policy_id] = policy._build_compute_actions( + builder, [t.obs for t in eval_data], + rnn_in_cols, + prev_action_batch=[t.prev_action for t in eval_data], + prev_reward_batch=[t.prev_reward for t in eval_data]) else: - builder = None - eval_results = {} - rnn_in_cols = {} - for policy_id, eval_data in to_eval.items(): - rnn_in = _to_column_format([t.rnn_state for t in eval_data]) - rnn_in_cols[policy_id] = rnn_in + eval_results[policy_id] = policy.compute_actions( + [t.obs for t in eval_data], + rnn_in_cols, + prev_action_batch=[t.prev_action for t in eval_data], + prev_reward_batch=[t.prev_reward for t in eval_data], + episodes=[active_episodes[t.env_id] for t in eval_data]) + if builder: + for k, v in pending_fetches.items(): + eval_results[k] = builder.get(v) + + if clip_actions: + for policy_id, results in eval_results.items(): policy = _get_or_raise(policies, policy_id) - if builder and (policy.compute_actions.__code__ is - TFPolicyGraph.compute_actions.__code__): - pending_fetches[policy_id] = policy.build_compute_actions( - builder, [t.obs for t in eval_data], - rnn_in, - is_training=True) + actions, rnn_out_cols, pi_info_cols = results + eval_results[policy_id] = (_clip_actions( + actions, policy.action_space), rnn_out_cols, pi_info_cols) + + return eval_results + + +def _process_policy_eval_results(to_eval, eval_results, active_episodes, + active_envs, off_policy_actions): + """Process the output of policy neural network evaluation. + + Records policy evaluation results into the given episode objects and + returns replies to send back to agents in the env. + + Returns: + actions_to_send: nested dict of env id -> agent id -> agent replies. 
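+            Envs with no pending agents still map to an empty dict so they
+            remain marked as ready.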
+ """ + + actions_to_send = defaultdict(dict) + for env_id in active_envs: + actions_to_send[env_id] = {} # at minimum send empty dict + + for policy_id, eval_data in to_eval.items(): + rnn_in_cols = _to_column_format([t.rnn_state for t in eval_data]) + actions, rnn_out_cols, pi_info_cols = eval_results[policy_id] + if len(rnn_in_cols) != len(rnn_out_cols): + raise ValueError("Length of RNN in did not match RNN out, got: " + "{} vs {}".format(rnn_in_cols, rnn_out_cols)) + # Add RNN state info + for f_i, column in enumerate(rnn_in_cols): + pi_info_cols["state_in_{}".format(f_i)] = column + for f_i, column in enumerate(rnn_out_cols): + pi_info_cols["state_out_{}".format(f_i)] = column + # Save output rows + actions = _unbatch_tuple_actions(actions) + for i, action in enumerate(actions): + env_id = eval_data[i].env_id + agent_id = eval_data[i].agent_id + actions_to_send[env_id][agent_id] = action + episode = active_episodes[env_id] + episode._set_rnn_state(agent_id, [c[i] for c in rnn_out_cols]) + episode._set_last_pi_info( + agent_id, {k: v[i] + for k, v in pi_info_cols.items()}) + if env_id in off_policy_actions and \ + agent_id in off_policy_actions[env_id]: + episode._set_last_action(agent_id, + off_policy_actions[env_id][agent_id]) else: - eval_results[policy_id] = policy.compute_actions( - [t.obs for t in eval_data], - rnn_in, - is_training=True, - episodes=[active_episodes[t.env_id] for t in eval_data]) - if builder: - for k, v in pending_fetches.items(): - eval_results[k] = builder.get(v) - - # Record the policy eval results - for policy_id, eval_data in to_eval.items(): - actions, rnn_out_cols, pi_info_cols = eval_results[policy_id] - # Add RNN state info - for f_i, column in enumerate(rnn_in_cols[policy_id]): - pi_info_cols["state_in_{}".format(f_i)] = column - for f_i, column in enumerate(rnn_out_cols): - pi_info_cols["state_out_{}".format(f_i)] = column - # Save output rows - for i, action in enumerate(actions): - env_id = eval_data[i].env_id - agent_id = eval_data[i].agent_id - actions_to_send[env_id][agent_id] = action - episode = active_episodes[env_id] - episode._set_rnn_state(agent_id, [c[i] for c in rnn_out_cols]) - episode._set_last_pi_info( - agent_id, {k: v[i] - for k, v in pi_info_cols.items()}) - if env_id in off_policy_actions and \ - agent_id in off_policy_actions[env_id]: - episode._set_last_action( - agent_id, off_policy_actions[env_id][agent_id]) - else: - episode._set_last_action(agent_id, action) + episode._set_last_action(agent_id, action) - # Return computed actions to ready envs. We also send to envs that have - # taken off-policy actions; those envs are free to ignore the action. - async_vector_env.send_actions(dict(actions_to_send)) + return actions_to_send def _fetch_atari_metrics(async_vector_env): @@ -405,10 +554,48 @@ def _fetch_atari_metrics(async_vector_env): if not monitor: return None for eps_rew, eps_len in monitor.next_episode_results(): - atari_out.append(RolloutMetrics(eps_len, eps_rew, {})) + atari_out.append(RolloutMetrics(eps_len, eps_rew, {}, {})) return atari_out +def _clip_actions(actions, space): + """Called to clip actions to the specified range of this policy. + + Arguments: + actions: Batch of actions or TupleActions. + space: Action space the actions should be present in. + + Returns: + Clipped batch of actions. 
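+
+    For example (illustrative values), a Box(-1.0, 1.0, shape=(1, )) space
+    clips the batch [[2.0], [-0.3]] elementwise to [[1.0], [-0.3]]. Tuple
+    actions are clipped per sub-space; other spaces pass through unchanged.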
+ """ + + if isinstance(space, gym.spaces.Box): + return np.clip(actions, space.low, space.high) + elif isinstance(space, gym.spaces.Tuple): + if not isinstance(actions, TupleActions): + raise ValueError("Expected tuple space for actions {}: {}".format( + actions, space)) + out = [] + for a, s in zip(actions.batches, space.spaces): + out.append(_clip_actions(a, s)) + return TupleActions(out) + else: + return actions + + +def _unbatch_tuple_actions(action_batch): + # convert list of batches -> batch of lists + if isinstance(action_batch, TupleActions): + out = [] + for j in range(len(action_batch.batches[0])): + out.append([ + action_batch.batches[i][j] + for i in range(len(action_batch.batches)) + ]) + return out + return action_batch + + def _to_column_format(rnn_state_rows): num_cols = len(rnn_state_rows[0]) return [[row[i] for row in rnn_state_rows] for i in range(num_cols)] diff --git a/python/ray/rllib/evaluation/tf_policy_graph.py b/python/ray/rllib/evaluation/tf_policy_graph.py index e9119c87527b4..e5a1d7b19732b 100644 --- a/python/ray/rllib/evaluation/tf_policy_graph.py +++ b/python/ray/rllib/evaluation/tf_policy_graph.py @@ -2,14 +2,18 @@ from __future__ import division from __future__ import print_function +import logging import tensorflow as tf import numpy as np import ray from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.models.lstm import chop_into_sequences -from ray.rllib.utils.tf_run_builder import TFRunBuilder +from ray.rllib.utils.annotations import override from ray.rllib.utils.schedules import ConstantSchedule, PiecewiseSchedule +from ray.rllib.utils.tf_run_builder import TFRunBuilder + +logger = logging.getLogger(__name__) class TFPolicyGraph(PolicyGraph): @@ -27,7 +31,7 @@ class TFPolicyGraph(PolicyGraph): Examples: >>> policy = TFPolicyGraphSubclass( - sess, obs_input, action_sampler, loss, loss_inputs, is_training) + sess, obs_input, action_sampler, loss, loss_inputs) >>> print(policy.compute_actions([1, 0, 2])) (array([0, 1, 1]), [], {}) @@ -46,8 +50,12 @@ def __init__(self, loss_inputs, state_inputs=None, state_outputs=None, + prev_action_input=None, + prev_reward_input=None, seq_lens=None, - max_seq_len=20): + max_seq_len=20, + batch_divisibility_req=1, + update_ops=None): """Initialize the policy graph. Arguments: @@ -62,174 +70,261 @@ def __init__(self, loss_inputs (list): a (name, placeholder) tuple for each loss input argument. Each placeholder name must correspond to a SampleBatch column key returned by postprocess_trajectory(), - and has shape [BATCH_SIZE, data...]. + and has shape [BATCH_SIZE, data...]. These keys will be read + from postprocessed sample batches and fed into the specified + placeholders during loss computation. state_inputs (list): list of RNN state input Tensors. state_outputs (list): list of RNN state output Tensors. + prev_action_input (Tensor): placeholder for previous actions + prev_reward_input (Tensor): placeholder for previous rewards seq_lens (Tensor): placeholder for RNN sequence lengths, of shape [NUM_SEQUENCES]. Note that NUM_SEQUENCES << BATCH_SIZE. See models/lstm.py for more information. max_seq_len (int): max sequence length for LSTM training. + batch_divisibility_req (int): pad all agent experiences batches to + multiples of this value. This only has an effect if not using + a LSTM model. + update_ops (list): override the batchnorm update ops to run when + applying gradients. Otherwise we run all update ops found in + the current variable scope. 
""" self.observation_space = observation_space self.action_space = action_space self._sess = sess self._obs_input = obs_input + self._prev_action_input = prev_action_input + self._prev_reward_input = prev_reward_input self._sampler = action_sampler self._loss = loss self._loss_inputs = loss_inputs self._loss_input_dict = dict(self._loss_inputs) - self._is_training = tf.placeholder_with_default(True, ()) + self._is_training = self._get_is_training_placeholder() self._state_inputs = state_inputs or [] self._state_outputs = state_outputs or [] for i, ph in enumerate(self._state_inputs): self._loss_input_dict["state_in_{}".format(i)] = ph self._seq_lens = seq_lens self._max_seq_len = max_seq_len + self._batch_divisibility_req = batch_divisibility_req + self._optimizer = self.optimizer() self._grads_and_vars = [(g, v) for (g, v) in self.gradients(self._optimizer) if g is not None] self._grads = [g for (g, v) in self._grads_and_vars] - self._apply_op = self._optimizer.apply_gradients(self._grads_and_vars) self._variables = ray.experimental.TensorFlowVariables( self._loss, self._sess) - assert len(self._state_inputs) == len(self._state_outputs) == \ - len(self.get_initial_state()), \ - (self._state_inputs, self._state_outputs, self.get_initial_state()) - if self._state_inputs: - assert self._seq_lens is not None - - def build_compute_actions(self, - builder, - obs_batch, - state_batches=None, - is_training=False, - episodes=None): - state_batches = state_batches or [] - assert len(self._state_inputs) == len(state_batches), \ - (self._state_inputs, state_batches) - builder.add_feed_dict(self.extra_compute_action_feed_dict()) - builder.add_feed_dict({self._obs_input: obs_batch}) - if state_batches: - builder.add_feed_dict({self._seq_lens: np.ones(len(obs_batch))}) - builder.add_feed_dict({self._is_training: is_training}) - builder.add_feed_dict(dict(zip(self._state_inputs, state_batches))) - fetches = builder.add_fetches([self._sampler] + self._state_outputs + - [self.extra_compute_action_fetches()]) - return fetches[0], fetches[1:-1], fetches[-1] - + # gather update ops for any batch norm layers + if update_ops: + self._update_ops = update_ops + else: + self._update_ops = tf.get_collection( + tf.GraphKeys.UPDATE_OPS, scope=tf.get_variable_scope().name) + if self._update_ops: + logger.debug("Update ops to run on apply gradient: {}".format( + self._update_ops)) + with tf.control_dependencies(self._update_ops): + # specify global_step for TD3 which needs to count the num updates + self._apply_op = self._optimizer.apply_gradients( + self._grads_and_vars, + global_step=tf.train.get_or_create_global_step()) + + if len(self._state_inputs) != len(self._state_outputs): + raise ValueError( + "Number of state input and output tensors must match, got: " + "{} vs {}".format(self._state_inputs, self._state_outputs)) + if len(self.get_initial_state()) != len(self._state_inputs): + raise ValueError( + "Length of initial state must match number of state inputs, " + "got: {} vs {}".format(self.get_initial_state(), + self._state_inputs)) + if self._state_inputs and self._seq_lens is None: + raise ValueError( + "seq_lens tensor must be given if state inputs are defined") + + logger.debug("Created {} with loss inputs: {}".format( + self, self._loss_input_dict)) + + @override(PolicyGraph) def compute_actions(self, obs_batch, state_batches=None, - is_training=False, + prev_action_batch=None, + prev_reward_batch=None, episodes=None): builder = TFRunBuilder(self._sess, "compute_actions") - fetches = 
self.build_compute_actions(builder, obs_batch, state_batches, - is_training) + fetches = self._build_compute_actions(builder, obs_batch, + state_batches, prev_action_batch, + prev_reward_batch) return builder.get(fetches) - def _get_loss_inputs_dict(self, batch): - feed_dict = {} - - # Simple case - if not self._state_inputs: - for k, ph in self._loss_inputs: - feed_dict[ph] = batch[k] - return feed_dict - - # RNN case - feature_keys = [k for k, v in self._loss_inputs] - state_keys = [ - "state_in_{}".format(i) for i in range(len(self._state_inputs)) - ] - feature_sequences, initial_states, seq_lens = chop_into_sequences( - batch["eps_id"], [batch[k] for k in feature_keys], - [batch[k] for k in state_keys], self._max_seq_len) - for k, v in zip(feature_keys, feature_sequences): - feed_dict[self._loss_input_dict[k]] = v - for k, v in zip(state_keys, initial_states): - feed_dict[self._loss_input_dict[k]] = v - feed_dict[self._seq_lens] = seq_lens - return feed_dict - - def build_compute_gradients(self, builder, postprocessed_batch): - builder.add_feed_dict(self.extra_compute_grad_feed_dict()) - builder.add_feed_dict({self._is_training: True}) - builder.add_feed_dict(self._get_loss_inputs_dict(postprocessed_batch)) - fetches = builder.add_fetches( - [self._grads, self.extra_compute_grad_fetches()]) - return fetches[0], fetches[1] - + @override(PolicyGraph) def compute_gradients(self, postprocessed_batch): builder = TFRunBuilder(self._sess, "compute_gradients") - fetches = self.build_compute_gradients(builder, postprocessed_batch) + fetches = self._build_compute_gradients(builder, postprocessed_batch) return builder.get(fetches) - def build_apply_gradients(self, builder, gradients): - assert len(gradients) == len(self._grads), (gradients, self._grads) - builder.add_feed_dict(self.extra_apply_grad_feed_dict()) - builder.add_feed_dict({self._is_training: True}) - builder.add_feed_dict(dict(zip(self._grads, gradients))) - fetches = builder.add_fetches( - [self._apply_op, self.extra_apply_grad_fetches()]) - return fetches[1] - + @override(PolicyGraph) def apply_gradients(self, gradients): builder = TFRunBuilder(self._sess, "apply_gradients") - fetches = self.build_apply_gradients(builder, gradients) + fetches = self._build_apply_gradients(builder, gradients) return builder.get(fetches) - def build_compute_apply(self, builder, postprocessed_batch): - builder.add_feed_dict(self.extra_compute_grad_feed_dict()) - builder.add_feed_dict(self.extra_apply_grad_feed_dict()) - builder.add_feed_dict(self._get_loss_inputs_dict(postprocessed_batch)) - builder.add_feed_dict({self._is_training: True}) - fetches = builder.add_fetches([ - self._apply_op, - self.extra_compute_grad_fetches(), - self.extra_apply_grad_fetches() - ]) - return fetches[1], fetches[2] - + @override(PolicyGraph) def compute_apply(self, postprocessed_batch): builder = TFRunBuilder(self._sess, "compute_apply") - fetches = self.build_compute_apply(builder, postprocessed_batch) + fetches = self._build_compute_apply(builder, postprocessed_batch) return builder.get(fetches) + @override(PolicyGraph) def get_weights(self): return self._variables.get_flat() + @override(PolicyGraph) def set_weights(self, weights): return self._variables.set_flat(weights) + def copy(self, existing_inputs): + """Creates a copy of self using existing input placeholders. 
+ + Optional, only required to work with the multi-GPU optimizer.""" + raise NotImplementedError + def extra_compute_action_feed_dict(self): + """Extra dict to pass to the compute actions session run.""" return {} def extra_compute_action_fetches(self): + """Extra values to fetch and return from compute_actions().""" return {} # e.g, value function def extra_compute_grad_feed_dict(self): + """Extra dict to pass to the compute gradients session run.""" return {} # e.g, kl_coeff def extra_compute_grad_fetches(self): + """Extra values to fetch and return from compute_gradients().""" return {} # e.g, td error def extra_apply_grad_feed_dict(self): + """Extra dict to pass to the apply gradients session run.""" return {} def extra_apply_grad_fetches(self): + """Extra values to fetch and return from apply_gradients().""" return {} # e.g., batch norm updates def optimizer(self): + """TF optimizer to use for policy optimization.""" return tf.train.AdamOptimizer() def gradients(self, optimizer): + """Override for custom gradient computation.""" return optimizer.compute_gradients(self._loss) - def loss_inputs(self): - return self._loss_inputs + def _build_compute_actions(self, + builder, + obs_batch, + state_batches=None, + prev_action_batch=None, + prev_reward_batch=None, + episodes=None): + state_batches = state_batches or [] + assert len(self._state_inputs) == len(state_batches), \ + (self._state_inputs, state_batches) + builder.add_feed_dict(self.extra_compute_action_feed_dict()) + builder.add_feed_dict({self._obs_input: obs_batch}) + if state_batches: + builder.add_feed_dict({self._seq_lens: np.ones(len(obs_batch))}) + if self._prev_action_input is not None and prev_action_batch: + builder.add_feed_dict({self._prev_action_input: prev_action_batch}) + if self._prev_reward_input is not None and prev_reward_batch: + builder.add_feed_dict({self._prev_reward_input: prev_reward_batch}) + builder.add_feed_dict({self._is_training: False}) + builder.add_feed_dict(dict(zip(self._state_inputs, state_batches))) + fetches = builder.add_fetches([self._sampler] + self._state_outputs + + [self.extra_compute_action_fetches()]) + return fetches[0], fetches[1:-1], fetches[-1] + + def _build_compute_gradients(self, builder, postprocessed_batch): + builder.add_feed_dict(self.extra_compute_grad_feed_dict()) + builder.add_feed_dict({self._is_training: True}) + builder.add_feed_dict(self._get_loss_inputs_dict(postprocessed_batch)) + fetches = builder.add_fetches( + [self._grads, self.extra_compute_grad_fetches()]) + return fetches[0], fetches[1] + + def _build_apply_gradients(self, builder, gradients): + assert len(gradients) == len(self._grads), (gradients, self._grads) + builder.add_feed_dict(self.extra_apply_grad_feed_dict()) + builder.add_feed_dict({self._is_training: True}) + builder.add_feed_dict(dict(zip(self._grads, gradients))) + fetches = builder.add_fetches( + [self._apply_op, self.extra_apply_grad_fetches()]) + return fetches[1] + + def _build_compute_apply(self, builder, postprocessed_batch): + builder.add_feed_dict(self.extra_compute_grad_feed_dict()) + builder.add_feed_dict(self.extra_apply_grad_feed_dict()) + builder.add_feed_dict(self._get_loss_inputs_dict(postprocessed_batch)) + builder.add_feed_dict({self._is_training: True}) + fetches = builder.add_fetches([ + self._apply_op, + self.extra_compute_grad_fetches(), + self.extra_apply_grad_fetches() + ]) + return fetches[1], fetches[2] + + def _get_is_training_placeholder(self): + """Get the placeholder for _is_training, i.e., for batch norm layers. 
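+
+        The placeholder defaults to False, so action computation runs in
+        inference mode unless True is fed explicitly (as the gradient ops do).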
+ + This can be called safely before __init__ has run. + """ + if not hasattr(self, "_is_training"): + self._is_training = tf.placeholder_with_default(False, ()) + return self._is_training + + def _get_loss_inputs_dict(self, batch): + feed_dict = {} + if self._batch_divisibility_req > 1: + meets_divisibility_reqs = ( + len(batch["obs"]) % self._batch_divisibility_req == 0 + and max(batch["agent_index"]) == 0) # not multiagent + else: + meets_divisibility_reqs = True + + # Simple case: not RNN nor do we need to pad + if not self._state_inputs and meets_divisibility_reqs: + for k, ph in self._loss_inputs: + feed_dict[ph] = batch[k] + return feed_dict + + if self._state_inputs: + max_seq_len = self._max_seq_len + dynamic_max = True + else: + max_seq_len = self._batch_divisibility_req + dynamic_max = False + + # RNN or multi-agent case + feature_keys = [k for k, v in self._loss_inputs] + state_keys = [ + "state_in_{}".format(i) for i in range(len(self._state_inputs)) + ] + feature_sequences, initial_states, seq_lens = chop_into_sequences( + batch["eps_id"], + batch["agent_index"], [batch[k] for k in feature_keys], + [batch[k] for k in state_keys], + max_seq_len, + dynamic_max=dynamic_max) + for k, v in zip(feature_keys, feature_sequences): + feed_dict[self._loss_input_dict[k]] = v + for k, v in zip(state_keys, initial_states): + feed_dict[self._loss_input_dict[k]] = v + feed_dict[self._seq_lens] = seq_lens + return feed_dict class LearningRateSchedule(object): @@ -243,11 +338,13 @@ def __init__(self, lr, lr_schedule): self.lr_schedule = PiecewiseSchedule( lr_schedule, outside_value=lr_schedule[-1][-1]) + @override(PolicyGraph) def on_global_var_update(self, global_vars): super(LearningRateSchedule, self).on_global_var_update(global_vars) self.cur_lr.load( self.lr_schedule.value(global_vars["timestep"]), session=self._sess) + @override(TFPolicyGraph) def optimizer(self): return tf.train.AdamOptimizer(self.cur_lr) diff --git a/python/ray/rllib/evaluation/torch_policy_graph.py b/python/ray/rllib/evaluation/torch_policy_graph.py index 741357f3aa8d5..c8e86e8451c73 100644 --- a/python/ray/rllib/evaluation/torch_policy_graph.py +++ b/python/ray/rllib/evaluation/torch_policy_graph.py @@ -13,6 +13,7 @@ pass # soft dep from ray.rllib.evaluation.policy_graph import PolicyGraph +from ray.rllib.utils.annotations import override class TorchPolicyGraph(PolicyGraph): @@ -56,21 +57,12 @@ def __init__(self, observation_space, action_space, model, loss, self._loss_inputs = loss_inputs self._optimizer = self.optimizer() - def extra_action_out(self, model_out): - """Returns dict of extra info to include in experience batch. 
- - Arguments: - model_out (list): Outputs of the policy model module.""" - return {} - - def optimizer(self): - """Custom PyTorch optimizer to use.""" - return torch.optim.Adam(self._model.parameters()) - + @override(PolicyGraph) def compute_actions(self, obs_batch, state_batches=None, - is_training=False, + prev_action_batch=None, + prev_reward_batch=None, episodes=None): if state_batches: raise NotImplementedError("Torch RNN support") @@ -82,6 +74,7 @@ def compute_actions(self, actions = F.softmax(logits, dim=1).multinomial(1).squeeze(0) return var_to_np(actions), [], self.extra_action_out(model_out) + @override(PolicyGraph) def compute_gradients(self, postprocessed_batch): with self.lock: loss_in = [] @@ -95,6 +88,7 @@ def compute_gradients(self, postprocessed_batch): grads = [var_to_np(p.grad.data) for p in self._model.parameters()] return grads, {} + @override(PolicyGraph) def apply_gradients(self, gradients): with self.lock: for g, p in zip(gradients, self._model.parameters()): @@ -102,10 +96,23 @@ def apply_gradients(self, gradients): self._optimizer.step() return {} + @override(PolicyGraph) def get_weights(self): with self.lock: return self._model.state_dict() + @override(PolicyGraph) def set_weights(self, weights): with self.lock: self._model.load_state_dict(weights) + + def extra_action_out(self, model_out): + """Returns dict of extra info to include in experience batch. + + Arguments: + model_out (list): Outputs of the policy model module.""" + return {} + + def optimizer(self): + """Custom PyTorch optimizer to use.""" + return torch.optim.Adam(self._model.parameters()) diff --git a/python/ray/rllib/examples/batch_norm_model.py b/python/ray/rllib/examples/batch_norm_model.py new file mode 100644 index 0000000000000..abd4b53666a2a --- /dev/null +++ b/python/ray/rllib/examples/batch_norm_model.py @@ -0,0 +1,64 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function +"""Example of using a custom model with batch norm.""" + +import argparse + +import tensorflow as tf +import tensorflow.contrib.slim as slim + +import ray +from ray.rllib.models import Model, ModelCatalog +from ray.rllib.models.misc import normc_initializer +from ray.tune import run_experiments + +parser = argparse.ArgumentParser() +parser.add_argument("--num-iters", type=int, default=200) +parser.add_argument("--run", type=str, default="PPO") + + +class BatchNormModel(Model): + def _build_layers_v2(self, input_dict, num_outputs, options): + last_layer = input_dict["obs"] + hiddens = [256, 256] + for i, size in enumerate(hiddens): + label = "fc{}".format(i) + last_layer = slim.fully_connected( + last_layer, + size, + weights_initializer=normc_initializer(1.0), + activation_fn=tf.nn.tanh, + scope=label) + # Add a batch norm layer + last_layer = tf.layers.batch_normalization( + last_layer, training=input_dict["is_training"]) + output = slim.fully_connected( + last_layer, + num_outputs, + weights_initializer=normc_initializer(0.01), + activation_fn=None, + scope="fc_out") + return output, last_layer + + +if __name__ == "__main__": + args = parser.parse_args() + ray.init() + + ModelCatalog.register_custom_model("bn_model", BatchNormModel) + run_experiments({ + "batch_norm_demo": { + "run": args.run, + "env": "Pendulum-v0" if args.run == "DDPG" else "CartPole-v0", + "stop": { + "training_iteration": args.num_iters + }, + "config": { + "model": { + "custom_model": "bn_model", + }, + "num_workers": 0, + }, + }, + }) diff --git a/examples/carla/README 
b/python/ray/rllib/examples/carla/README similarity index 100% rename from examples/carla/README rename to python/ray/rllib/examples/carla/README diff --git a/examples/carla/env.py b/python/ray/rllib/examples/carla/env.py similarity index 83% rename from examples/carla/env.py rename to python/ray/rllib/examples/carla/env.py index c88a71b28f51b..af5b619afcdb4 100644 --- a/examples/carla/env.py +++ b/python/ray/rllib/examples/carla/env.py @@ -33,8 +33,8 @@ os.makedirs(CARLA_OUT_PATH) # Set this to the path of your Carla binary -SERVER_BINARY = os.environ.get( - "CARLA_SERVER", os.path.expanduser("~/CARLA_0.7.0/CarlaUE4.sh")) +SERVER_BINARY = os.environ.get("CARLA_SERVER", + os.path.expanduser("~/CARLA_0.7.0/CarlaUE4.sh")) assert os.path.exists(SERVER_BINARY) if "CARLA_PY_PATH" in os.environ: @@ -97,7 +97,6 @@ "squash_action_logits": False, } - DISCRETE_ACTIONS = { # coast 0: [0.0, 0.0], @@ -119,7 +118,6 @@ 8: [-0.5, 0.5], } - live_carla_processes = set() @@ -133,7 +131,6 @@ def cleanup(): class CarlaEnv(gym.Env): - def __init__(self, config=ENV_CONFIG): self.config = config self.city = self.config["server_map"].split("/")[-1] @@ -143,21 +140,27 @@ def __init__(self, config=ENV_CONFIG): if config["discrete_actions"]: self.action_space = Discrete(len(DISCRETE_ACTIONS)) else: - self.action_space = Box(-1.0, 1.0, shape=(2,), dtype=np.float32) + self.action_space = Box(-1.0, 1.0, shape=(2, ), dtype=np.float32) if config["use_depth_camera"]: image_space = Box( - -1.0, 1.0, shape=( - config["y_res"], config["x_res"], - 1 * config["framestack"]), dtype=np.float32) + -1.0, + 1.0, + shape=(config["y_res"], config["x_res"], + 1 * config["framestack"]), + dtype=np.float32) else: image_space = Box( - 0, 255, shape=( - config["y_res"], config["x_res"], - 3 * config["framestack"]), dtype=np.uint8) + 0, + 255, + shape=(config["y_res"], config["x_res"], + 3 * config["framestack"]), + dtype=np.uint8) self.observation_space = Tuple( # forward_speed, dist to goal - [image_space, - Discrete(len(COMMANDS_ENUM)), # next_command - Box(-128.0, 128.0, shape=(2,), dtype=np.float32)]) + [ + image_space, + Discrete(len(COMMANDS_ENUM)), # next_command + Box(-128.0, 128.0, shape=(2, ), dtype=np.float32) + ]) # TODO(ekl) this isn't really a proper gym spec self._spec = lambda: None @@ -185,11 +188,13 @@ def init_server(self): # Create a new server process and start the client. 
self.server_port = random.randint(10000, 60000) self.server_process = subprocess.Popen( - [SERVER_BINARY, self.config["server_map"], - "-windowed", "-ResX=400", "-ResY=300", - "-carla-server", - "-carla-world-port={}".format(self.server_port)], - preexec_fn=os.setsid, stdout=open(os.devnull, "w")) + [ + SERVER_BINARY, self.config["server_map"], "-windowed", + "-ResX=400", "-ResY=300", "-carla-server", + "-carla-world-port={}".format(self.server_port) + ], + preexec_fn=os.setsid, + stdout=open(os.devnull, "w")) live_carla_processes.add(os.getpgid(self.server_process.pid)) for i in range(RETRIES_ON_ERROR): @@ -257,14 +262,14 @@ def _reset(self): if self.config["use_depth_camera"]: camera1 = Camera("CameraDepth", PostProcessing="Depth") - camera1.set_image_size( - self.config["render_x_res"], self.config["render_y_res"]) + camera1.set_image_size(self.config["render_x_res"], + self.config["render_y_res"]) camera1.set_position(30, 0, 130) settings.add_sensor(camera1) camera2 = Camera("CameraRGB") - camera2.set_image_size( - self.config["render_x_res"], self.config["render_y_res"]) + camera2.set_image_size(self.config["render_x_res"], + self.config["render_y_res"]) camera2.set_position(30, 0, 130) settings.add_sensor(camera2) @@ -274,13 +279,14 @@ def _reset(self): self.start_pos = positions[self.scenario["start_pos_id"]] self.end_pos = positions[self.scenario["end_pos_id"]] self.start_coord = [ - self.start_pos.location.x // 100, self.start_pos.location.y // 100] + self.start_pos.location.x // 100, self.start_pos.location.y // 100 + ] self.end_coord = [ - self.end_pos.location.x // 100, self.end_pos.location.y // 100] - print( - "Start pos {} ({}), end {} ({})".format( - self.scenario["start_pos_id"], self.start_coord, - self.scenario["end_pos_id"], self.end_coord)) + self.end_pos.location.x // 100, self.end_pos.location.y // 100 + ] + print("Start pos {} ({}), end {} ({})".format( + self.scenario["start_pos_id"], self.start_coord, + self.scenario["end_pos_id"], self.end_coord)) # Notify the server that we want to start the episode at the # player_start index. 
This function blocks until the server is ready @@ -300,11 +306,10 @@ def encode_obs(self, image, py_measurements): prev_image = image if self.config["framestack"] == 2: image = np.concatenate([prev_image, image], axis=2) - obs = ( - image, - COMMAND_ORDINAL[py_measurements["next_command"]], - [py_measurements["forward_speed"], - py_measurements["distance_to_goal"]]) + obs = (image, COMMAND_ORDINAL[py_measurements["next_command"]], [ + py_measurements["forward_speed"], + py_measurements["distance_to_goal"] + ]) self.last_obs = obs return obs @@ -313,9 +318,8 @@ def step(self, action): obs = self._step(action) return obs except Exception: - print( - "Error during step, terminating episode early", - traceback.format_exc()) + print("Error during step, terminating episode early", + traceback.format_exc()) self.clear_server_state() return (self.last_obs, 0.0, True, {}) @@ -336,12 +340,14 @@ def _step(self, action): hand_brake = False if self.config["verbose"]: - print( - "steer", steer, "throttle", throttle, "brake", brake, - "reverse", reverse) + print("steer", steer, "throttle", throttle, "brake", brake, + "reverse", reverse) self.client.send_control( - steer=steer, throttle=throttle, brake=brake, hand_brake=hand_brake, + steer=steer, + throttle=throttle, + brake=brake, + hand_brake=hand_brake, reverse=reverse) # Process observations @@ -359,15 +365,14 @@ def _step(self, action): "reverse": reverse, "hand_brake": hand_brake, } - reward = compute_reward( - self, self.prev_measurement, py_measurements) + reward = compute_reward(self, self.prev_measurement, py_measurements) self.total_reward += reward py_measurements["reward"] = reward py_measurements["total_reward"] = self.total_reward - done = (self.num_steps > self.scenario["max_steps"] or - py_measurements["next_command"] == "REACH_GOAL" or - (self.config["early_terminate_on_collision"] and - collided_done(py_measurements))) + done = (self.num_steps > self.scenario["max_steps"] + or py_measurements["next_command"] == "REACH_GOAL" + or (self.config["early_terminate_on_collision"] + and collided_done(py_measurements))) py_measurements["done"] = done self.prev_measurement = py_measurements @@ -377,8 +382,7 @@ def _step(self, action): self.measurements_file = open( os.path.join( CARLA_OUT_PATH, - "measurements_{}.json".format(self.episode_id)), - "w") + "measurements_{}.json".format(self.episode_id)), "w") self.measurements_file.write(json.dumps(py_measurements)) self.measurements_file.write("\n") if done: @@ -389,9 +393,8 @@ def _step(self, action): self.num_steps += 1 image = self.preprocess_image(image) - return ( - self.encode_obs(image, py_measurements), reward, done, - py_measurements) + return (self.encode_obs(image, py_measurements), reward, done, + py_measurements) def images_to_video(self): videos_dir = os.path.join(CARLA_OUT_PATH, "Videos") @@ -413,15 +416,15 @@ def preprocess_image(self, image): if self.config["use_depth_camera"]: assert self.config["use_depth_camera"] data = (image.data - 0.5) * 2 - data = data.reshape( - self.config["render_y_res"], self.config["render_x_res"], 1) + data = data.reshape(self.config["render_y_res"], + self.config["render_x_res"], 1) data = cv2.resize( data, (self.config["x_res"], self.config["y_res"]), interpolation=cv2.INTER_AREA) data = np.expand_dims(data, 2) else: - data = image.data.reshape( - self.config["render_y_res"], self.config["render_x_res"], 3) + data = image.data.reshape(self.config["render_y_res"], + self.config["render_x_res"], 3) data = cv2.resize( data, (self.config["x_res"], 
self.config["y_res"]), interpolation=cv2.INTER_AREA) @@ -448,36 +451,39 @@ def _read_observation(self): cur = measurements.player_measurements if self.config["enable_planner"]: - next_command = COMMANDS_ENUM[ - self.planner.get_next_command( - [cur.transform.location.x, cur.transform.location.y, - GROUND_Z], - [cur.transform.orientation.x, cur.transform.orientation.y, - GROUND_Z], - [self.end_pos.location.x, self.end_pos.location.y, - GROUND_Z], - [self.end_pos.orientation.x, self.end_pos.orientation.y, - GROUND_Z]) - ] + next_command = COMMANDS_ENUM[self.planner.get_next_command( + [cur.transform.location.x, cur.transform.location.y, GROUND_Z], + [ + cur.transform.orientation.x, cur.transform.orientation.y, + GROUND_Z + ], + [self.end_pos.location.x, self.end_pos.location.y, GROUND_Z], [ + self.end_pos.orientation.x, self.end_pos.orientation.y, + GROUND_Z + ])] else: next_command = "LANE_FOLLOW" if next_command == "REACH_GOAL": distance_to_goal = 0.0 # avoids crash in planner elif self.config["enable_planner"]: - distance_to_goal = self.planner.get_shortest_path_distance( - [cur.transform.location.x, cur.transform.location.y, GROUND_Z], - [cur.transform.orientation.x, cur.transform.orientation.y, - GROUND_Z], - [self.end_pos.location.x, self.end_pos.location.y, GROUND_Z], - [self.end_pos.orientation.x, self.end_pos.orientation.y, - GROUND_Z]) / 100 + distance_to_goal = self.planner.get_shortest_path_distance([ + cur.transform.location.x, cur.transform.location.y, GROUND_Z + ], [ + cur.transform.orientation.x, cur.transform.orientation.y, + GROUND_Z + ], [self.end_pos.location.x, self.end_pos.location.y, GROUND_Z], [ + self.end_pos.orientation.x, self.end_pos.orientation.y, + GROUND_Z + ]) / 100 else: distance_to_goal = -1 - distance_to_goal_euclidean = float(np.linalg.norm( - [cur.transform.location.x - self.end_pos.location.x, - cur.transform.location.y - self.end_pos.location.y]) / 100) + distance_to_goal_euclidean = float( + np.linalg.norm([ + cur.transform.location.x - self.end_pos.location.x, + cur.transform.location.y - self.end_pos.location.y + ]) / 100) py_measurements = { "episode_id": self.episode_id, @@ -513,8 +519,8 @@ def _read_observation(self): if not os.path.exists(out_dir): os.makedirs(out_dir) out_file = os.path.join( - out_dir, - "{}_{:>04}.jpg".format(self.episode_id, self.num_steps)) + out_dir, "{}_{:>04}.jpg".format(self.episode_id, + self.num_steps)) scipy.misc.imsave(out_file, image.data) assert observation is not None, sensor_data @@ -621,8 +627,7 @@ def compute_reward_lane_keep(env, prev, current): def compute_reward(env, prev, current): - return REWARD_FUNCTIONS[env.config["reward_function"]]( - env, prev, current) + return REWARD_FUNCTIONS[env.config["reward_function"]](env, prev, current) def print_measurements(measurements): @@ -654,9 +659,8 @@ def sigmoid(x): def collided_done(py_measurements): m = py_measurements - collided = ( - m["collision_vehicles"] > 0 or m["collision_pedestrians"] > 0 or - m["collision_other"] > 0) + collided = (m["collision_vehicles"] > 0 or m["collision_pedestrians"] > 0 + or m["collision_other"] > 0) return bool(collided or m["total_reward"] < -100) diff --git a/examples/carla/models.py b/python/ray/rllib/examples/carla/models.py similarity index 81% rename from examples/carla/models.py rename to python/ray/rllib/examples/carla/models.py index 9233c9c8ed2be..3f8cc0c5ba47b 100644 --- a/examples/carla/models.py +++ b/python/ray/rllib/examples/carla/models.py @@ -20,6 +20,7 @@ class CarlaModel(Model): further fully connected layers. 
""" + # TODO(ekl): use build_layers_v2 for native dict space support def _build_layers(self, inputs, num_outputs, options): # Parse options image_shape = options["custom_options"]["image_shape"] @@ -43,8 +44,8 @@ def _build_layers(self, inputs, num_outputs, options): (inputs.shape.as_list()[1:], expected_shape) # Reshape the input vector back into its components - vision_in = tf.reshape( - inputs[:, :image_size], [tf.shape(inputs)[0]] + image_shape) + vision_in = tf.reshape(inputs[:, :image_size], + [tf.shape(inputs)[0]] + image_shape) metrics_in = inputs[:, image_size:] print("Vision in shape", vision_in) print("Metrics in shape", metrics_in) @@ -53,18 +54,26 @@ def _build_layers(self, inputs, num_outputs, options): with tf.name_scope("carla_vision"): for i, (out_size, kernel, stride) in enumerate(convs[:-1], 1): vision_in = slim.conv2d( - vision_in, out_size, kernel, stride, + vision_in, + out_size, + kernel, + stride, scope="conv{}".format(i)) out_size, kernel, stride = convs[-1] vision_in = slim.conv2d( - vision_in, out_size, kernel, stride, - padding="VALID", scope="conv_out") + vision_in, + out_size, + kernel, + stride, + padding="VALID", + scope="conv_out") vision_in = tf.squeeze(vision_in, [1, 2]) # Setup metrics layer with tf.name_scope("carla_metrics"): metrics_in = slim.fully_connected( - metrics_in, 64, + metrics_in, + 64, weights_initializer=xavier_initializer(), activation_fn=activation, scope="metrics_out") @@ -79,15 +88,18 @@ def _build_layers(self, inputs, num_outputs, options): print("Shape of concatenated out is", last_layer.shape) for size in hiddens: last_layer = slim.fully_connected( - last_layer, size, + last_layer, + size, weights_initializer=xavier_initializer(), activation_fn=activation, scope="fc{}".format(i)) i += 1 output = slim.fully_connected( - last_layer, num_outputs, + last_layer, + num_outputs, weights_initializer=normc_initializer(0.01), - activation_fn=None, scope="fc_out") + activation_fn=None, + scope="fc_out") return output, last_layer diff --git a/python/ray/rllib/examples/carla/scenarios.py b/python/ray/rllib/examples/carla/scenarios.py new file mode 100644 index 0000000000000..beedd2989d5cf --- /dev/null +++ b/python/ray/rllib/examples/carla/scenarios.py @@ -0,0 +1,131 @@ +"""Collection of Carla scenarios, including those from the CoRL 2017 paper.""" + +TEST_WEATHERS = [0, 2, 5, 7, 9, 10, 11, 12, 13] +TRAIN_WEATHERS = [1, 3, 4, 6, 8, 14] + + +def build_scenario(city, start, end, vehicles, pedestrians, max_steps, + weathers): + return { + "city": city, + "num_vehicles": vehicles, + "num_pedestrians": pedestrians, + "weather_distribution": weathers, + "start_pos_id": start, + "end_pos_id": end, + "max_steps": max_steps, + } + + +# Simple scenario for Town02 that involves driving down a road +DEFAULT_SCENARIO = build_scenario( + city="Town02", + start=36, + end=40, + vehicles=20, + pedestrians=40, + max_steps=200, + weathers=[0]) + +# Simple scenario for Town02 that involves driving down a road +LANE_KEEP = build_scenario( + city="Town02", + start=36, + end=40, + vehicles=0, + pedestrians=0, + max_steps=2000, + weathers=[0]) + +# Scenarios from the CoRL2017 paper +POSES_TOWN1_STRAIGHT = [[36, 40], [39, 35], [110, 114], [7, 3], [0, 4], [ + 68, 50 +], [61, 59], [47, 64], [147, 90], [33, 87], [26, 19], [80, 76], [45, 49], [ + 55, 44 +], [29, 107], [95, 104], [84, 34], [53, 67], [22, 17], [91, 148], [20, 107], + [78, 70], [95, 102], [68, 44], [45, 69]] + +POSES_TOWN1_ONE_CURVE = [[138, 17], [47, 16], [26, 9], [42, 49], [140, 124], [ + 85, 98 +], [65, 
133], [137, 51], [76, 66], [46, 39], [40, 60], [0, 29], [4, 129], [ + 121, 140 +], [2, 129], [78, 44], [68, 85], [41, 102], [95, 70], [68, 129], [84, 69], + [47, 79], [110, 15], [130, 17], [0, 17]] + +POSES_TOWN1_NAV = [[105, 29], [27, 130], [102, 87], [132, 27], [24, 44], [ + 96, 26 +], [34, 67], [28, 1], [140, 134], [105, 9], [148, 129], [65, 18], [21, 16], [ + 147, 97 +], [42, 51], [30, 41], [18, 107], [69, 45], [102, 95], [18, 145], [111, 64], + [79, 45], [84, 69], [73, 31], [37, 81]] + +POSES_TOWN2_STRAIGHT = [[38, 34], [4, 2], [12, 10], [62, 55], [43, 47], [ + 64, 66 +], [78, 76], [59, 57], [61, 18], [35, 39], [12, 8], [0, 18], [75, 68], [ + 54, 60 +], [45, 49], [46, 42], [53, 46], [80, 29], [65, 63], [0, 81], [54, 63], + [51, 42], [16, 19], [17, 26], [77, 68]] + +POSES_TOWN2_ONE_CURVE = [[37, 76], [8, 24], [60, 69], [38, 10], [21, 1], [ + 58, 71 +], [74, 32], [44, 0], [71, 16], [14, 24], [34, 11], [43, 14], [75, 16], [ + 80, 21 +], [3, 23], [75, 59], [50, 47], [11, 19], [77, 34], [79, 25], [40, 63], + [58, 76], [79, 55], [16, 61], [27, 11]] + +POSES_TOWN2_NAV = [[19, 66], [79, 14], [19, 57], [23, 1], [53, 76], [42, 13], [ + 31, 71 +], [33, 5], [54, 30], [10, 61], [66, 3], [27, 12], [79, 19], [2, 29], [16, 14], + [5, 57], [70, 73], [46, 67], [57, 50], [61, 49], [21, 12], + [51, 81], [77, 68], [56, 65], [43, 54]] + +TOWN1_STRAIGHT = [ + build_scenario("Town01", start, end, 0, 0, 300, TEST_WEATHERS) + for (start, end) in POSES_TOWN1_STRAIGHT +] + +TOWN1_ONE_CURVE = [ + build_scenario("Town01", start, end, 0, 0, 600, TEST_WEATHERS) + for (start, end) in POSES_TOWN1_ONE_CURVE +] + +TOWN1_NAVIGATION = [ + build_scenario("Town01", start, end, 0, 0, 900, TEST_WEATHERS) + for (start, end) in POSES_TOWN1_NAV +] + +TOWN1_NAVIGATION_DYNAMIC = [ + build_scenario("Town01", start, end, 20, 50, 900, TEST_WEATHERS) + for (start, end) in POSES_TOWN1_NAV +] + +TOWN2_STRAIGHT = [ + build_scenario("Town02", start, end, 0, 0, 300, TRAIN_WEATHERS) + for (start, end) in POSES_TOWN2_STRAIGHT +] + +TOWN2_STRAIGHT_DYNAMIC = [ + build_scenario("Town02", start, end, 20, 50, 300, TRAIN_WEATHERS) + for (start, end) in POSES_TOWN2_STRAIGHT +] + +TOWN2_ONE_CURVE = [ + build_scenario("Town02", start, end, 0, 0, 600, TRAIN_WEATHERS) + for (start, end) in POSES_TOWN2_ONE_CURVE +] + +TOWN2_NAVIGATION = [ + build_scenario("Town02", start, end, 0, 0, 900, TRAIN_WEATHERS) + for (start, end) in POSES_TOWN2_NAV +] + +TOWN2_NAVIGATION_DYNAMIC = [ + build_scenario("Town02", start, end, 20, 50, 900, TRAIN_WEATHERS) + for (start, end) in POSES_TOWN2_NAV +] + +TOWN1_ALL = (TOWN1_STRAIGHT + TOWN1_ONE_CURVE + TOWN1_NAVIGATION + + TOWN1_NAVIGATION_DYNAMIC) + +TOWN2_ALL = (TOWN2_STRAIGHT + TOWN2_ONE_CURVE + TOWN2_NAVIGATION + + TOWN2_NAVIGATION_DYNAMIC) diff --git a/examples/carla/train_a3c.py b/python/ray/rllib/examples/carla/train_a3c.py similarity index 84% rename from examples/carla/train_a3c.py rename to python/ray/rllib/examples/carla/train_a3c.py index 75856aef266e0..8fbcfbc576d1e 100644 --- a/examples/carla/train_a3c.py +++ b/python/ray/rllib/examples/carla/train_a3c.py @@ -3,13 +3,12 @@ from __future__ import print_function import ray -from ray.tune import grid_search, register_env, run_experiments +from ray.tune import grid_search, run_experiments from env import CarlaEnv, ENV_CONFIG from models import register_carla_model from scenarios import TOWN2_STRAIGHT -env_name = "carla_env" env_config = ENV_CONFIG.copy() env_config.update({ "verbose": False, @@ -23,7 +22,6 @@ "scenarios": TOWN2_STRAIGHT, }) -register_env(env_name, 
lambda env_config: CarlaEnv(env_config)) register_carla_model() redis_address = ray.services.get_node_ip_address() + ":6379" @@ -31,8 +29,7 @@ run_experiments({ "carla-a3c": { "run": "A3C", - "env": "carla_env", - "trial_resources": {"cpu": 5, "extra_gpu": 2}, + "env": CarlaEnv, "config": { "env_config": env_config, "use_gpu_for_workers": True, diff --git a/examples/carla/train_dqn.py b/python/ray/rllib/examples/carla/train_dqn.py similarity index 71% rename from examples/carla/train_dqn.py rename to python/ray/rllib/examples/carla/train_dqn.py index 6180ca48f0dda..27aa65444d386 100644 --- a/examples/carla/train_dqn.py +++ b/python/ray/rllib/examples/carla/train_dqn.py @@ -3,13 +3,12 @@ from __future__ import print_function import ray -from ray.tune import register_env, run_experiments +from ray.tune import run_experiments from env import CarlaEnv, ENV_CONFIG from models import register_carla_model from scenarios import TOWN2_ONE_CURVE -env_name = "carla_env" env_config = ENV_CONFIG.copy() env_config.update({ "verbose": False, @@ -21,25 +20,29 @@ "scenarios": TOWN2_ONE_CURVE, }) -register_env(env_name, lambda env_config: CarlaEnv(env_config)) register_carla_model() ray.init() + + +def shape_out(spec): + return (spec.config.env_config.framestack * + (spec.config.env_config.use_depth_camera and 1 or 3)) + + run_experiments({ "carla-dqn": { "run": "DQN", - "env": "carla_env", - "trial_resources": {"cpu": 4, "gpu": 1}, + "env": CarlaEnv, "config": { "env_config": env_config, "model": { "custom_model": "carla", "custom_options": { "image_shape": [ - 80, 80, - lambda spec: spec.config.env_config.framestack * ( - spec.config.env_config.use_depth_camera and 1 or 3 - ), + 80, + 80, + shape_out, ], }, "conv_filters": [ @@ -53,7 +56,9 @@ "schedule_max_timesteps": 100000, "gamma": 0.8, "tf_session_args": { - "gpu_options": {"allow_growth": True}, + "gpu_options": { + "allow_growth": True + }, }, }, }, diff --git a/examples/carla/train_ppo.py b/python/ray/rllib/examples/carla/train_ppo.py similarity index 70% rename from examples/carla/train_ppo.py rename to python/ray/rllib/examples/carla/train_ppo.py index 4f3ebf5eab830..6c49240142c26 100644 --- a/examples/carla/train_ppo.py +++ b/python/ray/rllib/examples/carla/train_ppo.py @@ -3,13 +3,12 @@ from __future__ import print_function import ray -from ray.tune import register_env, run_experiments +from ray.tune import run_experiments from env import CarlaEnv, ENV_CONFIG from models import register_carla_model from scenarios import TOWN2_STRAIGHT -env_name = "carla_env" env_config = ENV_CONFIG.copy() env_config.update({ "verbose": False, @@ -20,22 +19,21 @@ "server_map": "/Game/Maps/Town02", "scenarios": TOWN2_STRAIGHT, }) -register_env(env_name, lambda env_config: CarlaEnv(env_config)) register_carla_model() ray.init(redirect_output=True) run_experiments({ "carla": { "run": "PPO", - "env": "carla_env", - "trial_resources": {"cpu": 4, "gpu": 1}, + "env": CarlaEnv, "config": { "env_config": env_config, "model": { "custom_model": "carla", "custom_options": { "image_shape": [ - env_config["x_res"], env_config["y_res"], 6], + env_config["x_res"], env_config["y_res"], 6 + ], }, "conv_filters": [ [16, [8, 8], 4], @@ -44,17 +42,14 @@ ], }, "num_workers": 1, - "timesteps_per_batch": 2000, - "min_steps_per_task": 100, + "train_batch_size": 2000, + "sample_batch_size": 100, "lambda": 0.95, "clip_param": 0.2, "num_sgd_iter": 20, - "sgd_stepsize": 0.0001, - "sgd_batchsize": 32, - "devices": ["/gpu:0"], - "tf_session_args": { - "gpu_options": {"allow_growth": True} - } 
+ "lr": 0.0001, + "sgd_minibatch_size": 32, + "num_gpus": 1, }, }, }) diff --git a/python/ray/rllib/examples/cartpole_lstm.py b/python/ray/rllib/examples/cartpole_lstm.py index e3d0ddc4c5701..ddc89c47e3b34 100644 --- a/python/ray/rllib/examples/cartpole_lstm.py +++ b/python/ray/rllib/examples/cartpole_lstm.py @@ -14,6 +14,8 @@ parser = argparse.ArgumentParser() parser.add_argument("--stop", type=int, default=200) +parser.add_argument("--use-prev-action-reward", action="store_true") +parser.add_argument("--run", type=str, default="PPO") class CartPoleStatelessEnv(gym.Env): @@ -163,18 +165,32 @@ def close(self): tune.register_env("cartpole_stateless", lambda _: CartPoleStatelessEnv()) ray.init() + + configs = { + "PPO": { + "num_sgd_iter": 5, + }, + "IMPALA": { + "num_workers": 2, + "num_gpus": 0, + "vf_loss_coeff": 0.01, + }, + } + tune.run_experiments({ "test": { "env": "cartpole_stateless", - "run": "PPO", + "run": args.run, "stop": { "episode_reward_mean": args.stop }, - "config": { - "num_sgd_iter": 5, - "model": { - "use_lstm": True, - }, - }, + "config": dict( + configs[args.run], **{ + "model": { + "use_lstm": True, + "lstm_use_prev_action_reward": args. + use_prev_action_reward, + }, + }), } }) diff --git a/examples/custom_env/custom_env.py b/python/ray/rllib/examples/custom_env.py similarity index 81% rename from examples/custom_env/custom_env.py rename to python/ray/rllib/examples/custom_env.py index b5a3240eaad0a..0d96eef6acb64 100644 --- a/examples/custom_env/custom_env.py +++ b/python/ray/rllib/examples/custom_env.py @@ -11,7 +11,6 @@ import ray from ray.tune import run_experiments -from ray.tune.registry import register_env class SimpleCorridor(gym.Env): @@ -24,7 +23,7 @@ def __init__(self, config): self.cur_pos = 0 self.action_space = Discrete(2) self.observation_space = Box( - 0.0, self.end_pos, shape=(1,), dtype=np.float32) + 0.0, self.end_pos, shape=(1, ), dtype=np.float32) self._spec = EnvSpec("SimpleCorridor-{}-v0".format(self.end_pos)) def reset(self): @@ -32,7 +31,7 @@ def reset(self): return [self.cur_pos] def step(self, action): - assert action in [0, 1] + assert action in [0, 1], action if action == 0 and self.cur_pos > 0: self.cur_pos -= 1 elif action == 1: @@ -42,13 +41,13 @@ def step(self, action): if __name__ == "__main__": - env_creator_name = "corridor" - register_env(env_creator_name, lambda config: SimpleCorridor(config)) + # Can also register the env creator function explicitly with: + # register_env("corridor", lambda config: SimpleCorridor(config)) ray.init() run_experiments({ "demo": { "run": "PPO", - "env": "corridor", + "env": SimpleCorridor, # or "corridor" if registered above "config": { "env_config": { "corridor_length": 5, diff --git a/python/ray/rllib/examples/custom_metrics_and_callbacks.py b/python/ray/rllib/examples/custom_metrics_and_callbacks.py new file mode 100644 index 0000000000000..af1d25f16cadf --- /dev/null +++ b/python/ray/rllib/examples/custom_metrics_and_callbacks.py @@ -0,0 +1,77 @@ +"""Example of using RLlib's debug callbacks. + +Here we use callbacks to track the average CartPole pole angle magnitude as a +custom metric. 
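+
+It can be run directly, e.g.:
+
+    python custom_metrics_and_callbacks.py --num-iters=2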
+""" + +import argparse +import numpy as np + +import ray +from ray import tune + + +def on_episode_start(info): + episode = info["episode"] + print("episode {} started".format(episode.episode_id)) + episode.user_data["pole_angles"] = [] + + +def on_episode_step(info): + episode = info["episode"] + pole_angle = abs(episode.last_observation_for()[2]) + episode.user_data["pole_angles"].append(pole_angle) + + +def on_episode_end(info): + episode = info["episode"] + pole_angle = np.mean(episode.user_data["pole_angles"]) + print("episode {} ended with length {} and pole angles {}".format( + episode.episode_id, episode.length, pole_angle)) + episode.custom_metrics["pole_angle"] = pole_angle + + +def on_sample_end(info): + print("returned sample batch of size {}".format(info["samples"].count)) + + +def on_train_result(info): + print("agent.train() result: {} -> {} episodes".format( + info["agent"], info["result"]["episodes_this_iter"])) + # you can mutate the result dict to add new fields to return + info["result"]["callback_ok"] = True + + +if __name__ == "__main__": + parser = argparse.ArgumentParser() + parser.add_argument("--num-iters", type=int, default=2000) + args = parser.parse_args() + + ray.init() + trials = tune.run_experiments({ + "test": { + "env": "CartPole-v0", + "run": "PG", + "stop": { + "training_iteration": args.num_iters, + }, + "config": { + "callbacks": { + "on_episode_start": tune.function(on_episode_start), + "on_episode_step": tune.function(on_episode_step), + "on_episode_end": tune.function(on_episode_end), + "on_sample_end": tune.function(on_sample_end), + "on_train_result": tune.function(on_train_result), + }, + }, + } + }) + + # verify custom metrics for integration tests + custom_metrics = trials[0].last_result["custom_metrics"] + print(custom_metrics) + assert "pole_angle_mean" in custom_metrics + assert "pole_angle_min" in custom_metrics + assert "pole_angle_max" in custom_metrics + assert type(custom_metrics["pole_angle_mean"]) is float + assert "callback_ok" in trials[0].last_result diff --git a/python/ray/rllib/examples/legacy_multiagent/multiagent_mountaincar.py b/python/ray/rllib/examples/legacy_multiagent/multiagent_mountaincar.py deleted file mode 100644 index 9559648290dae..0000000000000 --- a/python/ray/rllib/examples/legacy_multiagent/multiagent_mountaincar.py +++ /dev/null @@ -1,59 +0,0 @@ -""" Multiagent mountain car. Each agent outputs an action which -is summed to form the total action. 
This is a discrete -multiagent example -""" - -import gym -from gym.envs.registration import register - -import ray -import ray.rllib.agents.ppo as ppo -from ray.tune.registry import register_env - -env_name = "MultiAgentMountainCarEnv" - -env_version_num = 0 -env_name = env_name + '-v' + str(env_version_num) - - -def pass_params_to_gym(env_name): - global env_version_num - - register( - id=env_name, - entry_point=( - "ray.rllib.examples.legacy_multiagent.multiagent_mountaincar_env:" - "MultiAgentMountainCarEnv"), - max_episode_steps=200, - kwargs={}) - - -def create_env(env_config): - pass_params_to_gym(env_name) - env = gym.envs.make(env_name) - return env - - -if __name__ == '__main__': - register_env(env_name, lambda env_config: create_env(env_config)) - config = ppo.DEFAULT_CONFIG.copy() - horizon = 10 - num_cpus = 4 - ray.init(num_cpus=num_cpus, redirect_output=True) - config["num_workers"] = num_cpus - config["train_batch_size"] = 1000 - config["num_sgd_iter"] = 10 - config["gamma"] = 0.999 - config["horizon"] = horizon - config["use_gae"] = False - config["model"].update({"fcnet_hiddens": [256, 256]}) - options = { - "multiagent_obs_shapes": [2, 2], - "multiagent_act_shapes": [1, 1], - "multiagent_shared_model": False, - "multiagent_fcnet_hiddens": [[32, 32]] * 2 - } - config["model"].update({"custom_options": options}) - alg = ppo.PPOAgent(env=env_name, config=config) - for i in range(1): - alg.train() diff --git a/python/ray/rllib/examples/legacy_multiagent/multiagent_mountaincar_env.py b/python/ray/rllib/examples/legacy_multiagent/multiagent_mountaincar_env.py deleted file mode 100644 index c120f00c99ec7..0000000000000 --- a/python/ray/rllib/examples/legacy_multiagent/multiagent_mountaincar_env.py +++ /dev/null @@ -1,51 +0,0 @@ -from math import cos -from gym.spaces import Box, Tuple, Discrete -import numpy as np -from gym.envs.classic_control.mountain_car import MountainCarEnv -""" -Multiagent mountain car that sums and then -averages its actions to produce the velocity -""" - - -class MultiAgentMountainCarEnv(MountainCarEnv): - def __init__(self): - self.min_position = -1.2 - self.max_position = 0.6 - self.max_speed = 0.07 - self.goal_position = 0.5 - - self.low = np.array([self.min_position, -self.max_speed]) - self.high = np.array([self.max_position, self.max_speed]) - - self.viewer = None - - self.action_space = [Discrete(3) for _ in range(2)] - self.observation_space = Tuple( - [Box(self.low, self.high, dtype=np.float32) for _ in range(2)]) - - self.seed() - self.reset() - - def step(self, action): - summed_act = 0.5 * np.sum(action) - - position, velocity = self.state - velocity += (summed_act - 1) * 0.001 - velocity += cos(3 * position) * (-0.0025) - velocity = np.clip(velocity, -self.max_speed, self.max_speed) - position += velocity - position = np.clip(position, self.min_position, self.max_position) - if (position == self.min_position and velocity < 0): - velocity = 0 - - done = bool(position >= self.goal_position) - - reward = position - - self.state = (position, velocity) - return [np.array(self.state) for _ in range(2)], reward, done, {} - - def reset(self): - self.state = np.array([self.np_random.uniform(low=-0.6, high=-0.4), 0]) - return [np.array(self.state) for _ in range(2)] diff --git a/python/ray/rllib/examples/legacy_multiagent/multiagent_pendulum.py b/python/ray/rllib/examples/legacy_multiagent/multiagent_pendulum.py deleted file mode 100644 index b183ff2c0b157..0000000000000 --- a/python/ray/rllib/examples/legacy_multiagent/multiagent_pendulum.py +++ 
/dev/null @@ -1,60 +0,0 @@ -""" Run script for multiagent pendulum env. Each agent outputs a -torque which is summed to form the total torque. This is a -continuous multiagent example -""" - -import gym -from gym.envs.registration import register - -import ray -import ray.rllib.agents.ppo as ppo -from ray.tune.registry import register_env - -env_name = "MultiAgentPendulumEnv" - -env_version_num = 0 -env_name = env_name + '-v' + str(env_version_num) - - -def pass_params_to_gym(env_name): - global env_version_num - - register( - id=env_name, - entry_point=( - "ray.rllib.examples.legacy_multiagent.multiagent_pendulum_env:" - "MultiAgentPendulumEnv"), - max_episode_steps=100, - kwargs={}) - - -def create_env(env_config): - pass_params_to_gym(env_name) - env = gym.envs.make(env_name) - return env - - -if __name__ == '__main__': - register_env(env_name, lambda env_config: create_env(env_config)) - config = ppo.DEFAULT_CONFIG.copy() - horizon = 10 - num_cpus = 4 - ray.init(num_cpus=num_cpus, redirect_output=True) - config["num_workers"] = num_cpus - config["train_batch_size"] = 1000 - config["sgd_minibatch_size"] = 10 - config["num_sgd_iter"] = 10 - config["gamma"] = 0.999 - config["horizon"] = horizon - config["use_gae"] = True - config["model"].update({"fcnet_hiddens": [256, 256]}) - options = { - "multiagent_obs_shapes": [3, 3], - "multiagent_act_shapes": [1, 1], - "multiagent_shared_model": True, - "multiagent_fcnet_hiddens": [[32, 32]] * 2 - } - config["model"].update({"custom_options": options}) - alg = ppo.PPOAgent(env=env_name, config=config) - for i in range(1): - alg.train() diff --git a/python/ray/rllib/examples/legacy_multiagent/multiagent_pendulum_env.py b/python/ray/rllib/examples/legacy_multiagent/multiagent_pendulum_env.py deleted file mode 100644 index 02645832729f7..0000000000000 --- a/python/ray/rllib/examples/legacy_multiagent/multiagent_pendulum_env.py +++ /dev/null @@ -1,74 +0,0 @@ -from gym.spaces import Box, Tuple -from gym.utils import seeding -from gym.envs.classic_control.pendulum import PendulumEnv -import numpy as np -""" - Multiagent pendulum that sums its torques to generate an action -""" - - -class MultiAgentPendulumEnv(PendulumEnv): - metadata = { - 'render.modes': ['human', 'rgb_array'], - 'video.frames_per_second': 30 - } - - def __init__(self): - self.max_speed = 8 - self.max_torque = 2. - self.dt = .05 - self.viewer = None - - high = np.array([1., 1., self.max_speed]) - self.action_space = [ - Box(low=-self.max_torque / 2, - high=self.max_torque / 2, - shape=(1, ), - dtype=np.float32) for _ in range(2) - ] - self.observation_space = Tuple( - [Box(low=-high, high=high, dtype=np.float32) for _ in range(2)]) - - self.seed() - - def seed(self, seed=None): - self.np_random, seed = seeding.np_random(seed) - return [seed] - - def step(self, u): - th, thdot = self.state # th := theta - - summed_u = np.sum(u) - g = 10. - m = 1. - length = 1. - dt = self.dt - - summed_u = np.clip(summed_u, -self.max_torque, self.max_torque) - self.last_u = summed_u # for rendering - costs = self.angle_normalize(th) ** 2 + .1 * thdot ** 2 + \ - .001 * (summed_u ** 2) - - newthdot = thdot + (-3 * g / (2 * length) * np.sin(th + np.pi) + 3. 
/ - (m * length**2) * summed_u) * dt - newth = th + newthdot * dt - newthdot = np.clip(newthdot, -self.max_speed, self.max_speed) - - self.state = np.array([newth, newthdot]) - return self._get_obs(), -costs, False, {} - - def reset(self): - high = np.array([np.pi, 1]) - self.state = self.np_random.uniform(low=-high, high=high) - self.last_u = None - return self._get_obs() - - def _get_obs(self): - theta, thetadot = self.state - return [ - np.array([np.cos(theta), np.sin(theta), thetadot]) - for _ in range(2) - ] - - def angle_normalize(self, x): - return (((x + np.pi) % (2 * np.pi)) - np.pi) diff --git a/python/ray/rllib/examples/multiagent_cartpole.py b/python/ray/rllib/examples/multiagent_cartpole.py index 8faeb184bf6d7..e2ab5270f9d87 100644 --- a/python/ray/rllib/examples/multiagent_cartpole.py +++ b/python/ray/rllib/examples/multiagent_cartpole.py @@ -16,9 +16,13 @@ import gym import random +import tensorflow as tf +import tensorflow.contrib.slim as slim + import ray from ray import tune -from ray.rllib.agents.pg.pg_policy_graph import PGPolicyGraph +from ray.rllib.agents.ppo.ppo_policy_graph import PPOPolicyGraph +from ray.rllib.models import Model, ModelCatalog from ray.rllib.test.test_multi_agent_env import MultiCartpole from ray.tune import run_experiments from ray.tune.registry import register_env @@ -29,38 +33,82 @@ parser.add_argument("--num-policies", type=int, default=2) parser.add_argument("--num-iters", type=int, default=20) + +class CustomModel1(Model): + def _build_layers_v2(self, input_dict, num_outputs, options): + # Example of (optional) weight sharing between two different policies. + # Here, we share the variables defined in the 'shared' variable scope + # by entering it explicitly with tf.AUTO_REUSE. This creates the + # variables for the 'fc1' layer in a global scope called 'shared' + # outside of the policy's normal variable scope. 
+ with tf.variable_scope( + tf.VariableScope(tf.AUTO_REUSE, "shared"), + reuse=tf.AUTO_REUSE, + auxiliary_name_scope=False): + last_layer = slim.fully_connected( + input_dict["obs"], 64, activation_fn=tf.nn.relu, scope="fc1") + last_layer = slim.fully_connected( + last_layer, 64, activation_fn=tf.nn.relu, scope="fc2") + output = slim.fully_connected( + last_layer, num_outputs, activation_fn=None, scope="fc_out") + return output, last_layer + + +class CustomModel2(Model): + def _build_layers_v2(self, input_dict, num_outputs, options): + # Weights shared with CustomModel1 + with tf.variable_scope( + tf.VariableScope(tf.AUTO_REUSE, "shared"), + reuse=tf.AUTO_REUSE, + auxiliary_name_scope=False): + last_layer = slim.fully_connected( + input_dict["obs"], 64, activation_fn=tf.nn.relu, scope="fc1") + last_layer = slim.fully_connected( + last_layer, 64, activation_fn=tf.nn.relu, scope="fc2") + output = slim.fully_connected( + last_layer, num_outputs, activation_fn=None, scope="fc_out") + return output, last_layer + + if __name__ == "__main__": args = parser.parse_args() ray.init() # Simple environment with `num_agents` independent cartpole entities register_env("multi_cartpole", lambda _: MultiCartpole(args.num_agents)) + ModelCatalog.register_custom_model("model1", CustomModel1) + ModelCatalog.register_custom_model("model2", CustomModel2) single_env = gym.make("CartPole-v0") obs_space = single_env.observation_space act_space = single_env.action_space - def gen_policy(): + # Each policy can have a different configuration (including custom model) + def gen_policy(i): config = { - "gamma": random.choice([0.5, 0.8, 0.9, 0.95, 0.99]), - "n_step": random.choice([1, 2, 3, 4, 5]), + "model": { + "custom_model": ["model1", "model2"][i % 2], + }, + "gamma": random.choice([0.95, 0.99]), } - return (PGPolicyGraph, obs_space, act_space, config) + return (PPOPolicyGraph, obs_space, act_space, config) - # Setup PG with an ensemble of `num_policies` different policy graphs + # Setup PPO with an ensemble of `num_policies` different policy graphs policy_graphs = { - "policy_{}".format(i): gen_policy() + "policy_{}".format(i): gen_policy(i) for i in range(args.num_policies) } policy_ids = list(policy_graphs.keys()) run_experiments({ "test": { - "run": "PG", + "run": "PPO", "env": "multi_cartpole", "stop": { "training_iteration": args.num_iters }, "config": { + "log_level": "DEBUG", + "num_sgd_iter": 10, "multiagent": { "policy_graphs": policy_graphs, "policy_mapping_fn": tune.function( diff --git a/python/ray/rllib/examples/multiagent_two_trainers.py b/python/ray/rllib/examples/multiagent_two_trainers.py index e2c8bc97a8c23..46831db452b6d 100644 --- a/python/ray/rllib/examples/multiagent_two_trainers.py +++ b/python/ray/rllib/examples/multiagent_two_trainers.py @@ -57,7 +57,6 @@ def policy_mapping_fn(agent_id): "policy_mapping_fn": policy_mapping_fn, "policies_to_train": ["ppo_policy"], }, - "simple_optimizer": True, # disable filters, otherwise we would need to synchronize those # as well to the DQN agent "observation_filter": "NoFilter", diff --git a/python/ray/rllib/examples/parametric_action_cartpole.py b/python/ray/rllib/examples/parametric_action_cartpole.py new file mode 100644 index 0000000000000..a1438f0a24123 --- /dev/null +++ b/python/ray/rllib/examples/parametric_action_cartpole.py @@ -0,0 +1,196 @@ +"""Example of handling variable length and/or parametric action spaces. 
+ +This is a toy example of the action-embedding based approach for handling large +discrete action spaces (potentially infinite in size), similar to how +OpenAI Five works: + + https://neuro.cs.ut.ee/the-use-of-embeddings-in-openai-five/ + +This currently works with RLlib's policy gradient style algorithms +(e.g., PG, PPO, IMPALA, A2C) and also DQN. + +Note that since the model outputs now include "-inf" tf.float32.min +values, not all algorithm options are supported at the moment. For example, +algorithms might crash if they don't properly ignore the -inf action scores. +Working configurations are given below. +""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import argparse +import random +import numpy as np +import gym +from gym.spaces import Box, Discrete, Dict +import tensorflow as tf +import tensorflow.contrib.slim as slim + +import ray +from ray.rllib.models import Model, ModelCatalog +from ray.rllib.models.misc import normc_initializer +from ray.tune import run_experiments +from ray.tune.registry import register_env + +parser = argparse.ArgumentParser() +parser.add_argument("--stop", type=int, default=200) +parser.add_argument("--run", type=str, default="PPO") + + +class ParametricActionCartpole(gym.Env): + """Parametric action version of CartPole. + + In this env there are only ever two valid actions, but we pretend there are + actually up to `max_avail_actions` actions that can be taken, and the two + valid actions are randomly hidden among this set. + + At each step, we emit a dict of: + - the actual cart observation + - a mask of valid actions (e.g., [0, 0, 1, 0, 0, 1] for 6 max avail) + - the list of action embeddings (w/ zeroes for invalid actions) (e.g., + [[0, 0], + [0, 0], + [-0.2322, -0.2569], + [0, 0], + [0, 0], + [0.7878, 1.2297]] for max_avail_actions=6) + + In a real environment, the actions embeddings would be larger than two + units of course, and also there would be a variable number of valid actions + per step instead of always [LEFT, RIGHT]. 
+ """ + + def __init__(self, max_avail_actions): + # Use simple random 2-unit action embeddings for [LEFT, RIGHT] + self.left_action_embed = np.random.randn(2) + self.right_action_embed = np.random.randn(2) + self.action_space = Discrete(max_avail_actions) + self.wrapped = gym.make("CartPole-v0") + self.observation_space = Dict({ + "action_mask": Box(0, 1, shape=(max_avail_actions, )), + "avail_actions": Box(-1, 1, shape=(max_avail_actions, 2)), + "cart": self.wrapped.observation_space, + }) + + def update_avail_actions(self): + self.action_assignments = [[0, 0]] * self.action_space.n + self.action_mask = [0] * self.action_space.n + self.left_idx, self.right_idx = random.sample( + range(self.action_space.n), 2) + self.action_assignments[self.left_idx] = self.left_action_embed + self.action_assignments[self.right_idx] = self.right_action_embed + self.action_mask[self.left_idx] = 1 + self.action_mask[self.right_idx] = 1 + + def reset(self): + self.update_avail_actions() + return { + "action_mask": self.action_mask, + "avail_actions": self.action_assignments, + "cart": self.wrapped.reset(), + } + + def step(self, action): + if action == self.left_idx: + actual_action = 0 + elif action == self.right_idx: + actual_action = 1 + else: + raise ValueError( + "Chosen action was not one of the non-zero action embeddings", + action, self.action_assignments, self.action_mask, + self.left_idx, self.right_idx) + orig_obs, rew, done, info = self.wrapped.step(actual_action) + self.update_avail_actions() + obs = { + "action_mask": self.action_mask, + "avail_actions": self.action_assignments, + "cart": orig_obs, + } + return obs, rew, done, info + + +class ParametricActionsModel(Model): + """Parametric action model that handles the dot product and masking. + + This assumes the outputs are logits for a single Categorical action dist. + Getting this to work with a more complex output (e.g., if the action space + is a tuple of several distributions) is also possible but left as an + exercise to the reader. + """ + + def _build_layers_v2(self, input_dict, num_outputs, options): + # Extract the available actions tensor from the observation. + avail_actions = input_dict["obs"]["avail_actions"] + action_mask = input_dict["obs"]["action_mask"] + action_embed_size = avail_actions.shape[2].value + if num_outputs != avail_actions.shape[1].value: + raise ValueError( + "This model assumes num outputs is equal to max avail actions", + num_outputs, avail_actions) + + # Standard FC net component. + last_layer = input_dict["obs"]["cart"] + hiddens = [256, 256] + for i, size in enumerate(hiddens): + label = "fc{}".format(i) + last_layer = slim.fully_connected( + last_layer, + size, + weights_initializer=normc_initializer(1.0), + activation_fn=tf.nn.tanh, + scope=label) + output = slim.fully_connected( + last_layer, + action_embed_size, + weights_initializer=normc_initializer(0.01), + activation_fn=None, + scope="fc_out") + + # Expand the model output to [BATCH, 1, EMBED_SIZE]. Note that the + # avail actions tensor is of shape [BATCH, MAX_ACTIONS, EMBED_SIZE]. + intent_vector = tf.expand_dims(output, 1) + + # Batch dot product => shape of logits is [BATCH, MAX_ACTIONS]. 
+ action_logits = tf.reduce_sum(avail_actions * intent_vector, axis=2) + + # Mask out invalid actions (use tf.float32.min for stability) + inf_mask = tf.maximum(tf.log(action_mask), tf.float32.min) + masked_logits = inf_mask + action_logits + + return masked_logits, last_layer + + +if __name__ == "__main__": + args = parser.parse_args() + ray.init() + + ModelCatalog.register_custom_model("pa_model", ParametricActionsModel) + register_env("pa_cartpole", lambda _: ParametricActionCartpole(10)) + if args.run == "PPO": + cfg = { + "observation_filter": "NoFilter", # don't filter the action list + "vf_share_layers": True, # don't create duplicate value model + } + elif args.run == "DQN": + cfg = { + "hiddens": [], # don't postprocess the action scores + } + else: + cfg = {} + run_experiments({ + "parametric_cartpole": { + "run": args.run, + "env": "pa_cartpole", + "stop": { + "episode_reward_mean": args.stop, + }, + "config": dict({ + "model": { + "custom_model": "pa_model", + }, + "num_workers": 0, + }, **cfg), + }, + }) diff --git a/python/ray/rllib/examples/serving/cartpole_client.py b/python/ray/rllib/examples/serving/cartpole_client.py index 6f6a2e189c69a..b116eb9aa356b 100755 --- a/python/ray/rllib/examples/serving/cartpole_client.py +++ b/python/ray/rllib/examples/serving/cartpole_client.py @@ -29,7 +29,7 @@ if __name__ == "__main__": args = parser.parse_args() env = gym.make("CartPole-v0") - client = PolicyClient("http://localhost:8900") + client = PolicyClient("http://localhost:9900") eid = client.start_episode(training_enabled=not args.no_train) obs = env.reset() diff --git a/python/ray/rllib/examples/serving/cartpole_server.py b/python/ray/rllib/examples/serving/cartpole_server.py index dbbdf85809ff8..40260350ca3dd 100755 --- a/python/ray/rllib/examples/serving/cartpole_server.py +++ b/python/ray/rllib/examples/serving/cartpole_server.py @@ -14,19 +14,19 @@ import ray from ray.rllib.agents.dqn import DQNAgent -from ray.rllib.env.serving_env import ServingEnv +from ray.rllib.env.external_env import ExternalEnv from ray.rllib.utils.policy_server import PolicyServer from ray.tune.logger import pretty_print from ray.tune.registry import register_env SERVER_ADDRESS = "localhost" -SERVER_PORT = 8900 +SERVER_PORT = 9900 CHECKPOINT_FILE = "last_checkpoint.out" -class CartpoleServing(ServingEnv): +class CartpoleServing(ExternalEnv): def __init__(self): - ServingEnv.__init__( + ExternalEnv.__init__( self, spaces.Discrete(2), spaces.Box(low=-10, high=10, shape=(4, ), dtype=np.float32)) diff --git a/python/ray/rllib/examples/serving/test.sh b/python/ray/rllib/examples/serving/test.sh index d443a44a43223..d1dfa1e899c57 100755 --- a/python/ray/rllib/examples/serving/test.sh +++ b/python/ray/rllib/examples/serving/test.sh @@ -4,7 +4,7 @@ pkill -f cartpole_server.py (python cartpole_server.py 2>&1 | grep -v 200) & pid=$! -while ! curl localhost:8900; do +while ! 
curl localhost:9900; do sleep 1 done diff --git a/python/ray/rllib/models/__init__.py b/python/ray/rllib/models/__init__.py index ddfdd16b8ba18..52e47e807b3ff 100644 --- a/python/ray/rllib/models/__init__.py +++ b/python/ray/rllib/models/__init__.py @@ -1,4 +1,4 @@ -from ray.rllib.models.catalog import ModelCatalog +from ray.rllib.models.catalog import ModelCatalog, MODEL_DEFAULTS from ray.rllib.models.action_dist import (ActionDistribution, Categorical, DiagGaussian, Deterministic) from ray.rllib.models.model import Model @@ -7,6 +7,14 @@ from ray.rllib.models.lstm import LSTM __all__ = [ - "ActionDistribution", "Categorical", "DiagGaussian", "Deterministic", - "ModelCatalog", "Model", "Preprocessor", "FullyConnectedNetwork", "LSTM" + "ActionDistribution", + "Categorical", + "DiagGaussian", + "Deterministic", + "ModelCatalog", + "Model", + "Preprocessor", + "FullyConnectedNetwork", + "LSTM", + "MODEL_DEFAULTS", ] diff --git a/python/ray/rllib/models/action_dist.py b/python/ray/rllib/models/action_dist.py index b0cfe4141af16..f2a69efaf9b03 100644 --- a/python/ray/rllib/models/action_dist.py +++ b/python/ray/rllib/models/action_dist.py @@ -2,9 +2,12 @@ from __future__ import division from __future__ import print_function +from collections import namedtuple +import distutils.version import tensorflow as tf import numpy as np -import distutils.version + +from ray.rllib.utils.annotations import override use_tf150_api = (distutils.version.LooseVersion(tf.VERSION) >= distutils.version.LooseVersion("1.5.0")) @@ -40,10 +43,12 @@ def sample(self): class Categorical(ActionDistribution): """Categorical distribution for discrete action spaces.""" + @override(ActionDistribution) def logp(self, x): return -tf.nn.sparse_softmax_cross_entropy_with_logits( logits=self.inputs, labels=x) + @override(ActionDistribution) def entropy(self): if use_tf150_api: a0 = self.inputs - tf.reduce_max( @@ -59,6 +64,7 @@ def entropy(self): p0 = ea0 / z0 return tf.reduce_sum(p0 * (tf.log(z0) - a0), reduction_indices=[1]) + @override(ActionDistribution) def kl(self, other): if use_tf150_api: a0 = self.inputs - tf.reduce_max( @@ -82,6 +88,7 @@ def kl(self, other): return tf.reduce_sum( p0 * (a0 - tf.log(z0) - a1 + tf.log(z1)), reduction_indices=[1]) + @override(ActionDistribution) def sample(self): return tf.squeeze(tf.multinomial(self.inputs, 1), axis=1) @@ -93,28 +100,21 @@ class DiagGaussian(ActionDistribution): second half the gaussian standard deviations. """ - def __init__(self, inputs, low=None, high=None): + def __init__(self, inputs): ActionDistribution.__init__(self, inputs) mean, log_std = tf.split(inputs, 2, axis=1) self.mean = mean - self.low = low - self.high = high - - # Squash to range if specified. 
- # TODO(ekl) might make sense to use a beta distribution instead: - # http://proceedings.mlr.press/v70/chou17a/chou17a.pdf - if low is not None: - self.mean = low + tf.sigmoid(self.mean) * (high - low) - self.log_std = log_std self.std = tf.exp(log_std) + @override(ActionDistribution) def logp(self, x): return (-0.5 * tf.reduce_sum( tf.square((x - self.mean) / self.std), reduction_indices=[1]) - 0.5 * np.log(2.0 * np.pi) * tf.to_float(tf.shape(x)[1]) - tf.reduce_sum(self.log_std, reduction_indices=[1])) + @override(ActionDistribution) def kl(self, other): assert isinstance(other, DiagGaussian) return tf.reduce_sum( @@ -123,16 +123,15 @@ def kl(self, other): (2.0 * tf.square(other.std)) - 0.5, reduction_indices=[1]) + @override(ActionDistribution) def entropy(self): return tf.reduce_sum( .5 * self.log_std + .5 * np.log(2.0 * np.pi * np.e), reduction_indices=[1]) + @override(ActionDistribution) def sample(self): - out = self.mean + self.std * tf.random_normal(tf.shape(self.mean)) - if self.low is not None: - out = tf.clip_by_value(out, self.low, self.high) - return out + return self.mean + self.std * tf.random_normal(tf.shape(self.mean)) class Deterministic(ActionDistribution): @@ -141,38 +140,11 @@ class Deterministic(ActionDistribution): This is similar to DiagGaussian with standard deviation zero. """ + @override(ActionDistribution) def sample(self): return self.inputs -def squash_to_range(dist_cls, low, high): - """Squashes an action distribution to a range in (low, high). - - Arguments: - dist_cls (class): ActionDistribution class to wrap. - low (float|array): Scalar value or array of values. - high (float|array): Scalar value or array of values. - """ - - class SquashToRangeWrapper(dist_cls): - def __init__(self, inputs): - dist_cls.__init__(self, inputs, low=low, high=high) - - def logp(self, x): - return dist_cls.logp(self, x) - - def kl(self, other): - return dist_cls.kl(self, other) - - def entropy(self): - return dist_cls.entropy(self) - - def sample(self): - return dist_cls.sample(self) - - return SquashToRangeWrapper - - class MultiActionDistribution(ActionDistribution): """Action distribution that operates for list of actions. 
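To make the mean/log-std split of DiagGaussian concrete, a small usage sketch against ModelCatalog.get_action_dist() (updated in catalog.py further below); the Box space here is hypothetical:

import gym
import numpy as np

from ray.rllib.models import MODEL_DEFAULTS, ModelCatalog
from ray.rllib.models.action_dist import DiagGaussian

space = gym.spaces.Box(-1.0, 1.0, shape=(2, ), dtype=np.float32)
dist_cls, dist_dim = ModelCatalog.get_action_dist(space, MODEL_DEFAULTS)
# The model must emit dist_dim outputs, interpreted as
# [mean_0, mean_1, log_std_0, log_std_1].
assert dist_cls is DiagGaussian and dist_dim == 4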
@@ -188,8 +160,8 @@ def __init__(self, inputs, action_space, child_distributions, input_lens): child_list.append(distribution(split_inputs[i])) self.child_distributions = child_list + @override(ActionDistribution) def logp(self, x): - """The log-likelihood of the action distribution.""" split_indices = [] for dist in self.child_distributions: if isinstance(dist, Categorical): @@ -208,8 +180,8 @@ def logp(self, x): ]) return np.sum(log_list) + @override(ActionDistribution) def kl(self, other): - """The KL-divergence between two action distributions.""" kl_list = np.asarray([ distribution.kl(other_distribution) for distribution, other_distribution in zip( @@ -217,12 +189,15 @@ def kl(self, other): ]) return np.sum(kl_list) + @override(ActionDistribution) def entropy(self): - """The entropy of the action distribution.""" entropy_list = np.array( [s.entropy() for s in self.child_distributions]) return np.sum(entropy_list) + @override(ActionDistribution) def sample(self): - """Draw a sample from the action distribution.""" - return [[s.sample() for s in self.child_distributions]] + return TupleActions([s.sample() for s in self.child_distributions]) + + +TupleActions = namedtuple("TupleActions", ["batches"]) diff --git a/python/ray/rllib/models/catalog.py b/python/ray/rllib/models/catalog.py index b98061fdd02a4..822af4a37e66f 100644 --- a/python/ray/rllib/models/catalog.py +++ b/python/ray/rllib/models/catalog.py @@ -3,6 +3,7 @@ from __future__ import print_function import gym +import logging import numpy as np import tensorflow as tf from functools import partial @@ -10,38 +11,67 @@ from ray.tune.registry import RLLIB_MODEL, RLLIB_PREPROCESSOR, \ _global_registry +from ray.rllib.env.async_vector_env import _ExternalEnvToAsync +from ray.rllib.env.external_env import ExternalEnv +from ray.rllib.env.vector_env import VectorEnv from ray.rllib.models.action_dist import ( - Categorical, Deterministic, DiagGaussian, MultiActionDistribution, - squash_to_range) + Categorical, Deterministic, DiagGaussian, MultiActionDistribution) from ray.rllib.models.preprocessors import get_preprocessor from ray.rllib.models.fcnet import FullyConnectedNetwork from ray.rllib.models.visionnet import VisionNetwork from ray.rllib.models.lstm import LSTM -from ray.rllib.models.multiagentfcnet import MultiAgentFullyConnectedNetwork -MODEL_CONFIGS = [ +logger = logging.getLogger(__name__) + +# yapf: disable +# __sphinx_doc_begin__ +MODEL_DEFAULTS = { # === Built-in options === # Filter config. 
List of [out_channels, kernel, stride] for each filter - "conv_filters", - "conv_activation", # Nonlinearity for built-in convnet - "fcnet_activation", # Nonlinearity for fully connected net (tanh, relu) - "fcnet_hiddens", # Number of hidden layers for fully connected net - "dim", # Dimension for ATARI - "grayscale", # Converts ATARI frame to 1 Channel Grayscale image - "zero_mean", # Changes frame to range from [-1, 1] if true - "extra_frameskip", # (int) for number of frames to skip - "free_log_std", # Documented in ray.rllib.models.Model - "channel_major", # Pytorch conv requires images to be channel-major - "squash_to_range", # Whether to squash the action output to space range - "use_lstm", # Whether to wrap the model with a LSTM - "max_seq_len", # Max seq len for training the LSTM, defaults to 20 - "lstm_cell_size", # Size of the LSTM cell + "conv_filters": None, + # Nonlinearity for built-in convnet + "conv_activation": "relu", + # Nonlinearity for fully connected net (tanh, relu) + "fcnet_activation": "tanh", + # Number of hidden layers for fully connected net + "fcnet_hiddens": [256, 256], + # For control envs, documented in ray.rllib.models.Model + "free_log_std": False, + # (deprecated) Whether to use sigmoid to squash actions to space range + "squash_to_range": False, + + # == LSTM == + # Whether to wrap the model with a LSTM + "use_lstm": False, + # Max seq len for training the LSTM, defaults to 20 + "max_seq_len": 20, + # Size of the LSTM cell + "lstm_cell_size": 256, + # Whether to feed a_{t-1}, r_{t-1} to LSTM + "lstm_use_prev_action_reward": False, + + # == Atari == + # Whether to enable framestack for Atari envs + "framestack": True, + # Final resized frame dimension + "dim": 84, + # Pytorch conv requires images to be channel-major + "channel_major": False, + # (deprecated) Converts ATARI frame to 1 Channel Grayscale image + "grayscale": False, + # (deprecated) Changes frame to range from [-1, 1] if true + "zero_mean": True, # === Options for custom models === - "custom_preprocessor", # Name of a custom preprocessor to use - "custom_model", # Name of a custom model to use - "custom_options", # Extra options to pass to the custom classes -] + # Name of a custom preprocessor to use + "custom_preprocessor": None, + # Name of a custom model to use + "custom_model": None, + # Extra options to pass to the custom classes + "custom_options": {}, +} +# __sphinx_doc_end__ +# yapf: enable class ModelCatalog(object): @@ -51,14 +81,15 @@ class ModelCatalog(object): >>> prep = ModelCatalog.get_preprocessor(env) >>> observation = prep.transform(raw_observation) - >>> dist_cls, dist_dim = ModelCatalog.get_action_dist(env.action_space) - >>> model = ModelCatalog.get_model(inputs, dist_dim) + >>> dist_cls, dist_dim = ModelCatalog.get_action_dist( + env.action_space, {}) + >>> model = ModelCatalog.get_model(inputs, dist_dim, options) >>> dist = dist_cls(model.outputs) >>> action = dist.sample() """ @staticmethod - def get_action_dist(action_space, config=None, dist_type=None): + def get_action_dist(action_space, config, dist_type=None): """Returns action distribution class and size for the given action space. Args: @@ -71,18 +102,22 @@ def get_action_dist(action_space, config=None, dist_type=None): dist_dim (int): The size of the input vector to the distribution. """ - # TODO(ekl) are list spaces valid? 
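The MODEL_DEFAULTS keys above are overridden per experiment through the "model" section of an agent config, with unspecified keys falling back to the defaults. A minimal sketch with hypothetical settings:

config = {
    "model": {
        "use_lstm": True,
        "lstm_cell_size": 128,
        "lstm_use_prev_action_reward": True,
        "fcnet_hiddens": [64, 64],
    },
}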
- if isinstance(action_space, list): - action_space = gym.spaces.Tuple(action_space) - config = config or {} + config = config or MODEL_DEFAULTS if isinstance(action_space, gym.spaces.Box): + if len(action_space.shape) > 1: + raise ValueError( + "Action space has multiple dimensions " + "{}. ".format(action_space.shape) + + "Consider reshaping this into a single dimension, " + "using a Tuple action space, or the multi-agent API.") if dist_type is None: dist = DiagGaussian if config.get("squash_to_range"): - dist = squash_to_range(dist, action_space.low, - action_space.high) + raise ValueError( + "The squash_to_range option is deprecated. See the " + "clip_actions agent option instead.") return dist, action_space.shape[0] * 2 - elif dist_type == 'deterministic': + elif dist_type == "deterministic": return Deterministic, action_space.shape[0] elif isinstance(action_space, gym.spaces.Discrete): return Categorical, action_space.n @@ -90,7 +125,8 @@ def get_action_dist(action_space, config=None, dist_type=None): child_dist = [] input_lens = [] for action in action_space.spaces: - dist, action_size = ModelCatalog.get_action_dist(action) + dist, action_size = ModelCatalog.get_action_dist( + action, config) child_dist.append(dist) input_lens.append(action_size) return partial( @@ -112,10 +148,6 @@ def get_action_placeholder(action_space): action_placeholder (Tensor): A placeholder for the actions """ - # TODO(ekl) are list spaces valid? - if isinstance(action_space, list): - action_space = gym.spaces.Tuple(action_space) - if isinstance(action_space, gym.spaces.Box): return tf.placeholder( tf.float32, shape=(None, action_space.shape[0]), name="action") @@ -139,62 +171,71 @@ def get_action_placeholder(action_space): " not supported".format(action_space)) @staticmethod - def get_model(inputs, + def get_model(input_dict, + obs_space, num_outputs, - options=None, + options, state_in=None, seq_lens=None): """Returns a suitable model conforming to given input and output specs. Args: - inputs (Tensor): The input tensor to the model. + input_dict (dict): Dict of input tensors to the model, including + the observation under the "obs" key. + obs_space (Space): Observation space of the target gym env. num_outputs (int): The size of the output vector of the model. options (dict): Optional args to pass to the model constructor. state_in (list): Optional RNN state in tensors. seq_in (Tensor): Optional RNN sequence length tensor. Returns: - model (Model): Neural network model. + model (models.Model): Neural network model. 
""" - options = options or {} - model = ModelCatalog._get_model(inputs, num_outputs, options, state_in, - seq_lens) + assert isinstance(input_dict, dict) + options = options or MODEL_DEFAULTS + model = ModelCatalog._get_model(input_dict, obs_space, num_outputs, + options, state_in, seq_lens) if options.get("use_lstm"): - model = LSTM(model.last_layer, num_outputs, options, state_in, + copy = dict(input_dict) + copy["obs"] = model.last_layer + feature_space = gym.spaces.Box( + -1, 1, shape=(model.last_layer.shape[1], )) + model = LSTM(copy, feature_space, num_outputs, options, state_in, seq_lens) + logger.debug("Created model {}: ({} of {}, {}, {}) -> {}, {}".format( + model, input_dict, obs_space, state_in, seq_lens, model.outputs, + model.state_out)) + + model._validate_output_shape() return model @staticmethod - def _get_model(inputs, num_outputs, options, state_in, seq_lens): - if "custom_model" in options: + def _get_model(input_dict, obs_space, num_outputs, options, state_in, + seq_lens): + if options.get("custom_model"): model = options["custom_model"] - print("Using custom model {}".format(model)) + logger.debug("Using custom model {}".format(model)) return _global_registry.get(RLLIB_MODEL, model)( - inputs, + input_dict, + obs_space, num_outputs, options, state_in=state_in, seq_lens=seq_lens) - obs_rank = len(inputs.shape) - 1 - - # num_outputs > 1 used to avoid hitting this with the value function - if isinstance( - options.get("custom_options", {}).get( - "multiagent_fcnet_hiddens", 1), list) and num_outputs > 1: - return MultiAgentFullyConnectedNetwork(inputs, num_outputs, - options) + obs_rank = len(input_dict["obs"].shape) - 1 if obs_rank > 1: - return VisionNetwork(inputs, num_outputs, options) + return VisionNetwork(input_dict, obs_space, num_outputs, options) - return FullyConnectedNetwork(inputs, num_outputs, options) + return FullyConnectedNetwork(input_dict, obs_space, num_outputs, + options) @staticmethod - def get_torch_model(input_shape, num_outputs, options={}): + def get_torch_model(input_shape, num_outputs, options=None): """Returns a PyTorch suitable model. This is currently only supported in A3C. @@ -204,16 +245,17 @@ def get_torch_model(input_shape, num_outputs, options={}): options (dict): Optional args to pass to the model constructor. Returns: - model (Model): Neural network model. + model (models.Model): Neural network model. """ from ray.rllib.models.pytorch.fcnet import (FullyConnectedNetwork as PyTorchFCNet) from ray.rllib.models.pytorch.visionnet import (VisionNetwork as PyTorchVisionNet) - if "custom_model" in options: + options = options or MODEL_DEFAULTS + if options.get("custom_model"): model = options["custom_model"] - print("Using custom torch model {}".format(model)) + logger.info("Using custom torch model {}".format(model)) return _global_registry.get(RLLIB_MODEL, model)( input_shape, num_outputs, options) @@ -228,44 +270,68 @@ def get_torch_model(input_shape, num_outputs, options={}): return PyTorchFCNet(input_shape[0], num_outputs, options) @staticmethod - def get_preprocessor(env, options={}): - """Returns a suitable processor for the given environment. + def get_preprocessor(env, options=None): + """Returns a suitable preprocessor for the given env. + + This is a wrapper for get_preprocessor_for_space(). 
+ """ + + return ModelCatalog.get_preprocessor_for_space(env.observation_space, + options) + + @staticmethod + def get_preprocessor_for_space(observation_space, options=None): + """Returns a suitable preprocessor for the given observation space. Args: - env (gym.Env): The gym environment to preprocess. + observation_space (Space): The input observation space. options (dict): Options to pass to the preprocessor. Returns: - preprocessor (Preprocessor): Preprocessor for the env observations. + preprocessor (Preprocessor): Preprocessor for the observations. """ + + options = options or MODEL_DEFAULTS for k in options.keys(): - if k not in MODEL_CONFIGS: + if k not in MODEL_DEFAULTS: raise Exception("Unknown config key `{}`, all keys: {}".format( - k, MODEL_CONFIGS)) + k, list(MODEL_DEFAULTS))) - if "custom_preprocessor" in options: + if options.get("custom_preprocessor"): preprocessor = options["custom_preprocessor"] - print("Using custom preprocessor {}".format(preprocessor)) - return _global_registry.get(RLLIB_PREPROCESSOR, preprocessor)( - env.observation_space, options) + logger.info("Using custom preprocessor {}".format(preprocessor)) + prep = _global_registry.get(RLLIB_PREPROCESSOR, preprocessor)( + observation_space, options) + else: + cls = get_preprocessor(observation_space) + prep = cls(observation_space, options) - preprocessor = get_preprocessor(env.observation_space) - return preprocessor(env.observation_space, options) + logger.debug("Created preprocessor {}: {} -> {}".format( + prep, observation_space, prep.shape)) + return prep @staticmethod - def get_preprocessor_as_wrapper(env, options={}): + def get_preprocessor_as_wrapper(env, options=None): """Returns a preprocessor as a gym observation wrapper. Args: - env (gym.Env): The gym environment to wrap. + env (gym.Env|VectorEnv|ExternalEnv): The environment to wrap. options (dict): Options to pass to the preprocessor. Returns: - wrapper (gym.ObservationWrapper): Preprocessor in wrapper form. 
+ env (RLlib env): Wrapped environment """ + options = options or MODEL_DEFAULTS preprocessor = ModelCatalog.get_preprocessor(env, options) - return _RLlibPreprocessorWrapper(env, preprocessor) + if isinstance(env, gym.Env): + return _RLlibPreprocessorWrapper(env, preprocessor) + elif isinstance(env, VectorEnv): + return _RLlibVectorPreprocessorWrapper(env, preprocessor) + elif isinstance(env, ExternalEnv): + return _ExternalEnvToAsync(env, preprocessor) + else: + raise ValueError("Don't know how to wrap {}".format(env)) @staticmethod def register_custom_preprocessor(preprocessor_name, preprocessor_class): @@ -301,10 +367,32 @@ class _RLlibPreprocessorWrapper(gym.ObservationWrapper): def __init__(self, env, preprocessor): super(_RLlibPreprocessorWrapper, self).__init__(env) self.preprocessor = preprocessor - - from gym.spaces.box import Box - self.observation_space = Box( - -1.0, 1.0, preprocessor.shape, dtype=np.float32) + self.observation_space = preprocessor.observation_space def observation(self, observation): return self.preprocessor.transform(observation) + + +class _RLlibVectorPreprocessorWrapper(VectorEnv): + """Preprocessing wrapper for vector envs.""" + + def __init__(self, env, preprocessor): + self.env = env + self.prep = preprocessor + self.action_space = env.action_space + self.observation_space = preprocessor.observation_space + self.num_envs = env.num_envs + + def vector_reset(self): + return [self.prep.transform(obs) for obs in self.env.vector_reset()] + + def reset_at(self, index): + return self.prep.transform(self.env.reset_at(index)) + + def vector_step(self, actions): + obs, rewards, dones, infos = self.env.vector_step(actions) + obs = [self.prep.transform(o) for o in obs] + return obs, rewards, dones, infos + + def get_unwrapped(self): + return self.env.get_unwrapped() diff --git a/python/ray/rllib/models/fcnet.py b/python/ray/rllib/models/fcnet.py index 11aee2c0da8f4..19745b9e7a3ca 100644 --- a/python/ray/rllib/models/fcnet.py +++ b/python/ray/rllib/models/fcnet.py @@ -7,14 +7,22 @@ from ray.rllib.models.model import Model from ray.rllib.models.misc import normc_initializer, get_activation_fn +from ray.rllib.utils.annotations import override class FullyConnectedNetwork(Model): """Generic fully connected network.""" + @override(Model) def _build_layers(self, inputs, num_outputs, options): - hiddens = options.get("fcnet_hiddens", [256, 256]) - activation = get_activation_fn(options.get("fcnet_activation", "tanh")) + """Process the flattened inputs. + + Note that dict inputs will be flattened into a vector. To define a + model that processes the components separately, use _build_layers_v2(). + """ + + hiddens = options.get("fcnet_hiddens") + activation = get_activation_fn(options.get("fcnet_activation")) with tf.name_scope("fc_net"): i = 1 diff --git a/python/ray/rllib/models/lstm.py b/python/ray/rllib/models/lstm.py index 581569f0eff0c..323c7f375bb3f 100644 --- a/python/ray/rllib/models/lstm.py +++ b/python/ray/rllib/models/lstm.py @@ -9,6 +9,10 @@ postprocessing, we dynamically pad the experience batches so that this reshaping is possible. +Note that this padding strategy only works out if we assume zero inputs don't +meaningfully affect the loss function. This happens to be true for all the +current algorithms: https://github.com/ray-project/ray/issues/2992 + See the add_time_dimension() and chop_into_sequences() functions below for more info. 
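To illustrate the padding scheme, a small worked sketch of chop_into_sequences() (defined later in this file) with hypothetical inputs:

import numpy as np

from ray.rllib.models.lstm import chop_into_sequences

obs = np.arange(5).reshape(5, 1)    # five steps of a 1-d feature column
eps_ids = [1, 1, 1, 5, 5]           # steps from two different episodes
agent_ids = [0, 0, 0, 0, 0]         # a single agent throughout
f_pad, s_init, seq_lens = chop_into_sequences(
    eps_ids, agent_ids, [obs], [], max_seq_len=4)
print(seq_lens)  # [3 2]
# dynamic_max shrinks the padded length to the longest sequence (3), so
# f_pad[0] holds obs[0:3], then obs[3:5] followed by one zero row.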
""" @@ -19,6 +23,72 @@ from ray.rllib.models.misc import linear, normc_initializer from ray.rllib.models.model import Model +from ray.rllib.utils.annotations import override + + +class LSTM(Model): + """Adds a LSTM cell on top of some other model output. + + Uses a linear layer at the end for output. + + Important: we assume inputs is a padded batch of sequences denoted by + self.seq_lens. See add_time_dimension() for more information. + """ + + @override(Model) + def _build_layers_v2(self, input_dict, num_outputs, options): + cell_size = options.get("lstm_cell_size") + if options.get("lstm_use_prev_action_reward"): + action_dim = int( + np.product( + input_dict["prev_actions"].get_shape().as_list()[1:])) + features = tf.concat( + [ + input_dict["obs"], + tf.reshape( + tf.cast(input_dict["prev_actions"], tf.float32), + [-1, action_dim]), + tf.reshape(input_dict["prev_rewards"], [-1, 1]), + ], + axis=1) + else: + features = input_dict["obs"] + last_layer = add_time_dimension(features, self.seq_lens) + + # Setup the LSTM cell + lstm = rnn.BasicLSTMCell(cell_size, state_is_tuple=True) + self.state_init = [ + np.zeros(lstm.state_size.c, np.float32), + np.zeros(lstm.state_size.h, np.float32) + ] + + # Setup LSTM inputs + if self.state_in: + c_in, h_in = self.state_in + else: + c_in = tf.placeholder( + tf.float32, [None, lstm.state_size.c], name="c") + h_in = tf.placeholder( + tf.float32, [None, lstm.state_size.h], name="h") + self.state_in = [c_in, h_in] + + # Setup LSTM outputs + state_in = rnn.LSTMStateTuple(c_in, h_in) + lstm_out, lstm_state = tf.nn.dynamic_rnn( + lstm, + last_layer, + initial_state=state_in, + sequence_length=self.seq_lens, + time_major=False, + dtype=tf.float32) + + self.state_out = list(lstm_state) + + # Compute outputs + last_layer = tf.reshape(lstm_out, [-1, cell_size]) + logits = linear(last_layer, num_outputs, "action", + normc_initializer(0.01)) + return logits, last_layer def add_time_dimension(padded_inputs, seq_lens): @@ -48,15 +118,24 @@ def add_time_dimension(padded_inputs, seq_lens): return tf.reshape(padded_inputs, new_shape) -def chop_into_sequences(episode_ids, feature_columns, state_columns, - max_seq_len): +def chop_into_sequences(episode_ids, + agent_indices, + feature_columns, + state_columns, + max_seq_len, + dynamic_max=True): """Truncate and pad experiences into fixed-length sequences. Arguments: episode_ids (list): List of episode ids for each step. + agent_indices (list): List of agent ids for each step. Note that this + has to be combined with episode_ids for uniqueness. feature_columns (list): List of arrays containing features. state_columns (list): List of arrays containing LSTM state values. max_seq_len (int): Max length of sequences before truncation. + dynamic_max (bool): Whether to dynamically shrink the max seq len. + For example, if max len is 20 and the actual max seq len in the + data is 7, it will be shrunk to 7. Returns: f_pad (list): Padded feature columns. 
These will be of shape @@ -84,19 +163,21 @@ def chop_into_sequences(episode_ids, feature_columns, state_columns, prev_id = None seq_lens = [] seq_len = 0 - for eps_id in episode_ids: - if (prev_id is not None and eps_id != prev_id) or \ + unique_ids = np.add(episode_ids, agent_indices) + for uid in unique_ids: + if (prev_id is not None and uid != prev_id) or \ seq_len >= max_seq_len: seq_lens.append(seq_len) seq_len = 0 seq_len += 1 - prev_id = eps_id + prev_id = uid if seq_len: seq_lens.append(seq_len) - assert sum(seq_lens) == len(episode_ids) + assert sum(seq_lens) == len(unique_ids) # Dynamically shrink max len as needed to optimize memory usage - max_seq_len = max(seq_lens) + if dynamic_max: + max_seq_len = max(seq_lens) feature_sequences = [] for f in feature_columns: @@ -109,7 +190,7 @@ def chop_into_sequences(episode_ids, feature_columns, state_columns, f_pad[seq_base + seq_offset] = f[i] i += 1 seq_base += max_seq_len - assert i == len(episode_ids), f + assert i == len(unique_ids), f feature_sequences.append(f_pad) initial_states = [] @@ -123,52 +204,3 @@ def chop_into_sequences(episode_ids, feature_columns, state_columns, initial_states.append(np.array(s_init)) return feature_sequences, initial_states, np.array(seq_lens) - - -class LSTM(Model): - """Adds a LSTM cell on top of some other model output. - - Uses a linear layer at the end for output. - - Important: we assume inputs is a padded batch of sequences denoted by - self.seq_lens. See add_time_dimension() for more information. - """ - - def _build_layers(self, inputs, num_outputs, options): - cell_size = options.get("lstm_cell_size", 256) - last_layer = add_time_dimension(inputs, self.seq_lens) - - # Setup the LSTM cell - lstm = rnn.BasicLSTMCell(cell_size, state_is_tuple=True) - self.state_init = [ - np.zeros(lstm.state_size.c, np.float32), - np.zeros(lstm.state_size.h, np.float32) - ] - - # Setup LSTM inputs - if self.state_in: - c_in, h_in = self.state_in - else: - c_in = tf.placeholder( - tf.float32, [None, lstm.state_size.c], name="c") - h_in = tf.placeholder( - tf.float32, [None, lstm.state_size.h], name="h") - self.state_in = [c_in, h_in] - - # Setup LSTM outputs - state_in = rnn.LSTMStateTuple(c_in, h_in) - lstm_out, lstm_state = tf.nn.dynamic_rnn( - lstm, - last_layer, - initial_state=state_in, - sequence_length=self.seq_lens, - time_major=False, - dtype=tf.float32) - - self.state_out = list(lstm_state) - - # Compute outputs - last_layer = tf.reshape(lstm_out, [-1, cell_size]) - logits = linear(last_layer, num_outputs, "action", - normc_initializer(0.01)) - return logits, last_layer diff --git a/python/ray/rllib/models/model.py b/python/ray/rllib/models/model.py index 00d6575e62104..818966bb12e1a 100644 --- a/python/ray/rllib/models/model.py +++ b/python/ray/rllib/models/model.py @@ -2,8 +2,14 @@ from __future__ import division from __future__ import print_function +from collections import OrderedDict + +import gym import tensorflow as tf +from ray.rllib.models.misc import linear, normc_initializer +from ray.rllib.models.preprocessors import get_preprocessor + class Model(object): """Defines an abstract network model for use with RLlib. @@ -16,12 +22,12 @@ class Model(object): needs to further post-processing (e.g. Actor and Critic networks in A3C). Attributes: - inputs (Tensor): The input placeholder for this model, of shape - [BATCH_SIZE, ...]. + input_dict (dict): Dictionary of input tensors, including "obs", + "prev_action", "prev_reward", "is_training". 
outputs (Tensor): The output vector of this model, of shape [BATCH_SIZE, num_outputs]. - last_layer (Tensor): The network layer right before the model output, - of shape [BATCH_SIZE, N]. + last_layer (Tensor): The feature layer right before the model output, + of shape [BATCH_SIZE, f]. state_init (list): List of initial recurrent state tensors (if any). state_in (list): List of input recurrent state tensors (if any). state_out (list): List of output recurrent state tensors (if any). @@ -38,12 +44,13 @@ class Model(object): """ def __init__(self, - inputs, + input_dict, + obs_space, num_outputs, options, state_in=None, seq_lens=None): - self.inputs = inputs + assert isinstance(input_dict, dict), input_dict # Default attribute values for the non-RNN case self.state_init = [] @@ -55,11 +62,18 @@ def __init__(self, self.seq_lens = tf.placeholder( dtype=tf.int32, shape=[None], name="seq_lens") - if options.get("free_log_std", False): + self._num_outputs = num_outputs + if options.get("free_log_std"): assert num_outputs % 2 == 0 num_outputs = num_outputs // 2 - self.outputs, self.last_layer = self._build_layers( - inputs, num_outputs, options) + try: + self.outputs, self.last_layer = self._build_layers_v2( + _restore_original_dimensions(input_dict, obs_space), + num_outputs, options) + except NotImplementedError: + self.outputs, self.last_layer = self._build_layers( + input_dict["obs"], num_outputs, options) + if options.get("free_log_std", False): log_std = tf.get_variable( name="log_std", @@ -68,6 +82,118 @@ def __init__(self, self.outputs = tf.concat( [self.outputs, 0.0 * self.outputs + log_std], 1) - def _build_layers(self): - """Builds and returns the output and last layer of the network.""" + def _build_layers(self, inputs, num_outputs, options): + """Builds and returns the output and last layer of the network. + + Deprecated: use _build_layers_v2 instead, which has better support + for dict and tuple spaces. + """ + raise NotImplementedError + + def _build_layers_v2(self, input_dict, num_outputs, options): + """Define the layers of a custom model. + + Arguments: + input_dict (dict): Dictionary of input tensors, including "obs", + "prev_action", "prev_reward", "is_training". + num_outputs (int): Output tensor must be of size + [BATCH_SIZE, num_outputs]. + options (dict): Model options. + + Returns: + (outputs, feature_layer): Tensors of size [BATCH_SIZE, num_outputs] + and [BATCH_SIZE, desired_feature_size]. + + When using dict or tuple observation spaces, you can access + the nested sub-observation batches here as well: + + Examples: + >>> print(input_dict) + {'prev_actions': , + 'prev_rewards': , + 'is_training': , + 'obs': OrderedDict([ + ('sensors', OrderedDict([ + ('front_cam', [ + , + ]), + ('position', ), + ('velocity', )]))])} + """ raise NotImplementedError + + def value_function(self): + """Builds the value function output. + + This method can be overridden to customize the implementation of the + value function (e.g., not sharing hidden layers). + + Returns: + Tensor of size [BATCH_SIZE] for the value function. + """ + return tf.reshape( + linear(self.last_layer, 1, "value", normc_initializer(1.0)), [-1]) + + def loss(self): + """Builds any built-in (self-supervised) loss for the model. + + For example, this can be used to incorporate auto-encoder style losses. + Note that this loss has to be included in the policy graph loss to have + an effect (done for built-in algorithms). + + Returns: + Scalar tensor for the self-supervised loss. 
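To ground the _build_layers_v2() interface, a hypothetical custom model for a Dict observation space; the sub-observation names ("front_cam", "position") and layer sizes are illustrative assumptions:

import tensorflow as tf

from ray.rllib.models import Model


class MyDictObsModel(Model):
    def _build_layers_v2(self, input_dict, num_outputs, options):
        # Dict sub-observations arrive already unpacked into nested tensors.
        cam = input_dict["obs"]["front_cam"]
        pos = input_dict["obs"]["position"]
        features = tf.concat([tf.layers.flatten(cam), pos], axis=1)
        last_layer = tf.layers.dense(features, 64, activation=tf.nn.relu)
        output = tf.layers.dense(last_layer, num_outputs, activation=None)
        return output, last_layer

Such a model would be registered with ModelCatalog.register_custom_model() and selected via the "custom_model" option, as in the multiagent_cartpole.py example above.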
+ """ + return tf.constant(0.0) + + def _validate_output_shape(self): + """Checks that the model has the correct number of outputs.""" + try: + out = tf.convert_to_tensor(self.outputs) + shape = out.shape.as_list() + except Exception: + raise ValueError("Output is not a tensor: {}".format(self.outputs)) + else: + if len(shape) != 2 or shape[1] != self._num_outputs: + raise ValueError( + "Expected output shape of [None, {}], got {}".format( + self._num_outputs, shape)) + + +def _restore_original_dimensions(input_dict, obs_space): + if hasattr(obs_space, "original_space"): + return dict( + input_dict, + obs=_unpack_obs(input_dict["obs"], obs_space.original_space)) + return input_dict + + +def _unpack_obs(obs, space): + if (isinstance(space, gym.spaces.Dict) + or isinstance(space, gym.spaces.Tuple)): + prep = get_preprocessor(space)(space) + if len(obs.shape) != 2 or obs.shape[1] != prep.shape[0]: + raise ValueError( + "Expected flattened obs shape of [None, {}], got {}".format( + prep.shape[0], obs.shape)) + assert len(prep.preprocessors) == len(space.spaces), \ + (len(prep.preprocessors) == len(space.spaces)) + offset = 0 + if isinstance(space, gym.spaces.Tuple): + u = [] + for p, v in zip(prep.preprocessors, space.spaces): + obs_slice = obs[:, offset:offset + p.size] + offset += p.size + u.append( + _unpack_obs( + tf.reshape(obs_slice, [-1] + list(p.shape)), v)) + else: + u = OrderedDict() + for p, (k, v) in zip(prep.preprocessors, space.spaces.items()): + obs_slice = obs[:, offset:offset + p.size] + offset += p.size + u[k] = _unpack_obs( + tf.reshape(obs_slice, [-1] + list(p.shape)), v) + return u + else: + return obs diff --git a/python/ray/rllib/models/multiagentfcnet.py b/python/ray/rllib/models/multiagentfcnet.py deleted file mode 100644 index dad7f29831035..0000000000000 --- a/python/ray/rllib/models/multiagentfcnet.py +++ /dev/null @@ -1,43 +0,0 @@ -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import tensorflow as tf - -from ray.rllib.models.model import Model -from ray.rllib.models.fcnet import FullyConnectedNetwork -from ray.rllib.utils.reshaper import Reshaper - - -class MultiAgentFullyConnectedNetwork(Model): - """Multiagent fully connected network.""" - - def _build_layers(self, inputs, num_outputs, options): - # Split the input and output tensors - input_shapes = options["custom_options"]["multiagent_obs_shapes"] - output_shapes = options["custom_options"]["multiagent_act_shapes"] - input_reshaper = Reshaper(input_shapes) - output_reshaper = Reshaper(output_shapes) - split_inputs = input_reshaper.split_tensor(inputs) - num_actions = output_reshaper.split_number(num_outputs) - - custom_options = options["custom_options"] - hiddens = custom_options.get("multiagent_fcnet_hiddens", - [[256, 256]] * 1) - - # check for a shared model - shared_model = custom_options.get("multiagent_shared_model", 0) - reuse = tf.AUTO_REUSE if shared_model else False - outputs = [] - for i in range(len(hiddens)): - scope = "multi" if shared_model else "multi{}".format(i) - with tf.variable_scope(scope, reuse=reuse): - sub_options = options.copy() - sub_options.update({"fcnet_hiddens": hiddens[i]}) - # TODO(ev) make this support arbitrary networks - fcnet = FullyConnectedNetwork(split_inputs[i], - int(num_actions[i]), sub_options) - output = fcnet.outputs - outputs.append(output) - overall_output = tf.concat(outputs, axis=1) - return overall_output, outputs diff --git a/python/ray/rllib/models/preprocessors.py 
b/python/ray/rllib/models/preprocessors.py index c400dd9805d34..0238ef2d8d889 100644 --- a/python/ray/rllib/models/preprocessors.py +++ b/python/ray/rllib/models/preprocessors.py @@ -1,13 +1,20 @@ from __future__ import absolute_import from __future__ import division from __future__ import print_function + +from collections import OrderedDict import cv2 +import logging import numpy as np import gym +from ray.rllib.utils.annotations import override + ATARI_OBS_SHAPE = (210, 160, 3) ATARI_RAM_OBS_SHAPE = (128, ) +logger = logging.getLogger(__name__) + class Preprocessor(object): """Defines an abstract observation preprocessor function. @@ -16,35 +23,59 @@ class Preprocessor(object): shape (obj): Shape of the preprocessed output. """ - def __init__(self, obs_space, options): + def __init__(self, obs_space, options=None): legacy_patch_shapes(obs_space) self._obs_space = obs_space - self._options = options - self._init() + self._options = options or {} + self.shape = self._init_shape(obs_space, options) - def _init(self): - pass + def _init_shape(self, obs_space, options): + """Returns the shape after preprocessing.""" + raise NotImplementedError def transform(self, observation): """Returns the preprocessed observation.""" raise NotImplementedError + @property + def size(self): + return int(np.product(self.shape)) + + @property + def observation_space(self): + obs_space = gym.spaces.Box(-1.0, 1.0, self.shape, dtype=np.float32) + # Stash the unwrapped space so that we can unwrap dict and tuple spaces + # automatically in model.py + if (isinstance(self, TupleFlatteningPreprocessor) + or isinstance(self, DictFlatteningPreprocessor)): + obs_space.original_space = self._obs_space + return obs_space + -class AtariPixelPreprocessor(Preprocessor): - def _init(self): - self._grayscale = self._options.get("grayscale", False) - self._zero_mean = self._options.get("zero_mean", True) - self._dim = self._options.get("dim", 84) - self._channel_major = self._options.get("channel_major", False) +class GenericPixelPreprocessor(Preprocessor): + """Generic image preprocessor. + + Note: for Atari games, use config {"preprocessor_pref": "deepmind"} + instead for deepmind-style Atari preprocessing. 
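As a companion sketch for the reworked Preprocessor interface (the shape is now returned from _init_shape() instead of being set as a side effect of _init()), a hypothetical custom preprocessor; the class name and scaling are illustrative:

import numpy as np

from ray.rllib.models.preprocessors import Preprocessor
from ray.rllib.utils.annotations import override


class ScaledFloatPreprocessor(Preprocessor):
    """Casts observations to float32 and rescales pixel values into [0, 1]."""

    @override(Preprocessor)
    def _init_shape(self, obs_space, options):
        return obs_space.shape

    @override(Preprocessor)
    def transform(self, observation):
        return np.asarray(observation, dtype=np.float32) / 255.0

Custom preprocessors are registered via ModelCatalog.register_custom_preprocessor() and selected with the "custom_preprocessor" model option.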
+ """ + + @override(Preprocessor) + def _init_shape(self, obs_space, options): + self._grayscale = options.get("grayscale") + self._zero_mean = options.get("zero_mean") + self._dim = options.get("dim") + self._channel_major = options.get("channel_major") if self._grayscale: - self.shape = (self._dim, self._dim, 1) + shape = (self._dim, self._dim, 1) else: - self.shape = (self._dim, self._dim, 3) + shape = (self._dim, self._dim, 3) # channel_major requires (# in-channels, row dim, col dim) if self._channel_major: - self.shape = self.shape[-1:] + self.shape[:-1] + shape = shape[-1:] + shape[:-1] + return shape + @override(Preprocessor) def transform(self, observation): """Downsamples images from (210, 160, 3) by the configured factor.""" scaled = observation[25:-25, :, :] @@ -69,27 +100,36 @@ def transform(self, observation): class AtariRamPreprocessor(Preprocessor): - def _init(self): - self.shape = (128, ) + @override(Preprocessor) + def _init_shape(self, obs_space, options): + return (128, ) + @override(Preprocessor) def transform(self, observation): return (observation - 128) / 128 class OneHotPreprocessor(Preprocessor): - def _init(self): - self.shape = (self._obs_space.n, ) + @override(Preprocessor) + def _init_shape(self, obs_space, options): + return (self._obs_space.n, ) + @override(Preprocessor) def transform(self, observation): arr = np.zeros(self._obs_space.n) + if not self._obs_space.contains(observation): + raise ValueError("Observation outside expected value range", + self._obs_space, observation) arr[observation] = 1 return arr class NoPreprocessor(Preprocessor): - def _init(self): - self.shape = self._obs_space.shape + @override(Preprocessor) + def _init_shape(self, obs_space, options): + return self._obs_space.shape + @override(Preprocessor) def transform(self, observation): return observation @@ -97,30 +137,61 @@ def transform(self, observation): class TupleFlatteningPreprocessor(Preprocessor): """Preprocesses each tuple element, then flattens it all into a vector. - If desired, the vector output can be unpacked via tf.reshape() within a - custom model to handle each component separately. + RLlib models will unpack the flattened output before _build_layers_v2(). """ - def _init(self): + @override(Preprocessor) + def _init_shape(self, obs_space, options): assert isinstance(self._obs_space, gym.spaces.Tuple) size = 0 self.preprocessors = [] for i in range(len(self._obs_space.spaces)): space = self._obs_space.spaces[i] - print("Creating sub-preprocessor for", space) + logger.debug("Creating sub-preprocessor for {}".format(space)) preprocessor = get_preprocessor(space)(space, self._options) self.preprocessors.append(preprocessor) - size += np.product(preprocessor.shape) - self.shape = (size, ) + size += preprocessor.size + return (size, ) + @override(Preprocessor) def transform(self, observation): assert len(observation) == len(self.preprocessors), observation return np.concatenate([ - np.reshape(p.transform(o), [np.product(p.shape)]) + np.reshape(p.transform(o), [p.size]) for (o, p) in zip(observation, self.preprocessors) ]) +class DictFlatteningPreprocessor(Preprocessor): + """Preprocesses each dict value, then flattens it all into a vector. + + RLlib models will unpack the flattened output before _build_layers_v2(). 
+ """ + + @override(Preprocessor) + def _init_shape(self, obs_space, options): + assert isinstance(self._obs_space, gym.spaces.Dict) + size = 0 + self.preprocessors = [] + for space in self._obs_space.spaces.values(): + logger.debug("Creating sub-preprocessor for {}".format(space)) + preprocessor = get_preprocessor(space)(space, self._options) + self.preprocessors.append(preprocessor) + size += preprocessor.size + return (size, ) + + @override(Preprocessor) + def transform(self, observation): + if not isinstance(observation, OrderedDict): + observation = OrderedDict(sorted(list(observation.items()))) + assert len(observation) == len(self.preprocessors), \ + (len(observation), len(self.preprocessors)) + return np.concatenate([ + np.reshape(p.transform(o), [p.size]) + for (o, p) in zip(observation.values(), self.preprocessors) + ]) + + def get_preprocessor(space): """Returns an appropriate preprocessor class for the given space.""" @@ -130,11 +201,13 @@ def get_preprocessor(space): if isinstance(space, gym.spaces.Discrete): preprocessor = OneHotPreprocessor elif obs_shape == ATARI_OBS_SHAPE: - preprocessor = AtariPixelPreprocessor + preprocessor = GenericPixelPreprocessor elif obs_shape == ATARI_RAM_OBS_SHAPE: preprocessor = AtariRamPreprocessor elif isinstance(space, gym.spaces.Tuple): preprocessor = TupleFlatteningPreprocessor + elif isinstance(space, gym.spaces.Dict): + preprocessor = DictFlatteningPreprocessor else: preprocessor = NoPreprocessor diff --git a/python/ray/rllib/models/pytorch/fcnet.py b/python/ray/rllib/models/pytorch/fcnet.py index e8f50da2fb340..f69cb7ca21d45 100644 --- a/python/ray/rllib/models/pytorch/fcnet.py +++ b/python/ray/rllib/models/pytorch/fcnet.py @@ -2,10 +2,14 @@ from __future__ import division from __future__ import print_function +import logging + from ray.rllib.models.pytorch.model import Model, SlimFC from ray.rllib.models.pytorch.misc import normc_initializer import torch.nn as nn +logger = logging.getLogger(__name__) + class FullyConnectedNetwork(Model): """TODO(rliaw): Logits, Value should both be contained here""" @@ -19,7 +23,7 @@ def _build_layers(self, inputs, num_outputs, options): activation = nn.Tanh elif fcnet_activation == "relu": activation = nn.ReLU - print("Constructing fcnet {} {}".format(hiddens, activation)) + logger.info("Constructing fcnet {} {}".format(hiddens, activation)) layers = [] last_layer_size = inputs diff --git a/python/ray/rllib/models/pytorch/visionnet.py b/python/ray/rllib/models/pytorch/visionnet.py index 94ac8291d79af..e54c51897f2c3 100644 --- a/python/ray/rllib/models/pytorch/visionnet.py +++ b/python/ray/rllib/models/pytorch/visionnet.py @@ -18,11 +18,11 @@ def _build_layers(self, inputs, num_outputs, options): inputs (tuple): (channels, rows/height, cols/width) num_outputs (int): logits size """ - filters = options.get("conv_filters", [ + filters = options.get("conv_filters") or [ [16, [8, 8], 4], [32, [4, 4], 2], [512, [11, 11], 1], - ]) + ] layers = [] in_channels, in_size = inputs[0], inputs[1:] diff --git a/python/ray/rllib/models/visionnet.py b/python/ray/rllib/models/visionnet.py index 805d2e9e5ebef..0638c4fc83c59 100644 --- a/python/ray/rllib/models/visionnet.py +++ b/python/ray/rllib/models/visionnet.py @@ -7,17 +7,20 @@ from ray.rllib.models.model import Model from ray.rllib.models.misc import get_activation_fn, flatten +from ray.rllib.utils.annotations import override class VisionNetwork(Model): """Generic vision network.""" - def _build_layers(self, inputs, num_outputs, options): + @override(Model) + def 
_build_layers_v2(self, input_dict, num_outputs, options): + inputs = input_dict["obs"] filters = options.get("conv_filters") if not filters: - filters = get_filter_config(options) + filters = _get_filter_config(inputs) - activation = get_activation_fn(options.get("conv_activation", "relu")) + activation = get_activation_fn(options.get("conv_activation")) with tf.name_scope("vision_net"): for i, (out_size, kernel, stride) in enumerate(filters[:-1], 1): @@ -46,7 +49,7 @@ def _build_layers(self, inputs, num_outputs, options): return flatten(fc2), flatten(fc1) -def get_filter_config(options): +def _get_filter_config(inputs): filters_84x84 = [ [16, [8, 8], 4], [32, [4, 4], 2], @@ -57,12 +60,15 @@ def get_filter_config(options): [32, [4, 4], 2], [256, [11, 11], 1], ] - dim = options.get("dim", 84) - if dim == 84: + shape = inputs.shape.as_list()[1:] + if len(shape) == 3 and shape[:2] == [84, 84]: return filters_84x84 - elif dim == 42: + elif len(shape) == 3 and shape[:2] == [42, 42]: return filters_42x42 else: raise ValueError( - "No default configuration for image size={}".format(dim) + - ", you must specify `conv_filters` manually as a model option.") + "No default configuration for obs input {}".format(inputs) + + ", you must specify `conv_filters` manually as a model option. " + "Default configurations are only available for inputs of size " + "[?, 42, 42, K] and [?, 84, 84, K]. You may alternatively want " + "to use a custom model or preprocessor.") diff --git a/python/ray/rllib/optimizers/async_gradients_optimizer.py b/python/ray/rllib/optimizers/async_gradients_optimizer.py index fc7fdb2488a33..b1e5ebe846ca6 100644 --- a/python/ray/rllib/optimizers/async_gradients_optimizer.py +++ b/python/ray/rllib/optimizers/async_gradients_optimizer.py @@ -4,6 +4,7 @@ import ray from ray.rllib.optimizers.policy_optimizer import PolicyOptimizer +from ray.rllib.utils.annotations import override from ray.rllib.utils.timer import TimerStat @@ -15,6 +16,7 @@ class AsyncGradientsOptimizer(PolicyOptimizer): gradient computations on the remote workers. 
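The step() rewrite just below drops the old FIFO gradient_queue (which could not use ray.wait, per the removed note) in favor of a dict of in-flight futures drained with ray.wait, so whichever evaluator finishes first is processed first. A tiny standalone sketch of that pattern, using a made-up remote task rather than RLlib's evaluators:

    import ray

    ray.init()

    @ray.remote
    def slow_square(x):
        return x * x

    # Key the dict by future so the producing worker can be recovered later.
    pending = {slow_square.remote(i): i for i in range(4)}
    while pending:
        ready, _ = ray.wait(list(pending.keys()), num_returns=1)
        future = ready[0]
        result = ray.get(future)
        worker_id = pending.pop(future)
        print("worker {} finished: {}".format(worker_id, result))
        # In AsyncGradientsOptimizer this is where the gradient is applied and
        # a fresh compute_gradients task is launched for that evaluator.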
""" + @override(PolicyOptimizer) def _init(self, grads_per_step=100): self.apply_timer = TimerStat() self.wait_timer = TimerStat() @@ -25,23 +27,29 @@ def _init(self, grads_per_step=100): raise ValueError( "Async optimizer requires at least 1 remote evaluator") + @override(PolicyOptimizer) def step(self): weights = ray.put(self.local_evaluator.get_weights()) - gradient_queue = [] + pending_gradients = {} num_gradients = 0 # Kick off the first wave of async tasks for e in self.remote_evaluators: e.set_weights.remote(weights) - fut = e.compute_gradients.remote(e.sample.remote()) - gradient_queue.append((fut, e)) + future = e.compute_gradients.remote(e.sample.remote()) + pending_gradients[future] = e num_gradients += 1 - # Note: can't use wait: https://github.com/ray-project/ray/issues/1128 - while gradient_queue: + while pending_gradients: with self.wait_timer: - fut, e = gradient_queue.pop(0) - gradient, info = ray.get(fut) + wait_results = ray.wait( + list(pending_gradients.keys()), num_returns=1) + ready_list = wait_results[0] + future = ready_list[0] + + gradient, info = ray.get(future) + e = pending_gradients.pop(future) + if "stats" in info: self.learner_stats = info["stats"] @@ -54,10 +62,12 @@ def step(self): if num_gradients < self.grads_per_step: with self.dispatch_timer: e.set_weights.remote(self.local_evaluator.get_weights()) - fut = e.compute_gradients.remote(e.sample.remote()) - gradient_queue.append((fut, e)) + future = e.compute_gradients.remote(e.sample.remote()) + + pending_gradients[future] = e num_gradients += 1 + @override(PolicyOptimizer) def stats(self): return dict( PolicyOptimizer.stats(self), **{ diff --git a/python/ray/rllib/optimizers/async_replay_optimizer.py b/python/ray/rllib/optimizers/async_replay_optimizer.py index 3ed5f37d390fe..582bb65396c14 100644 --- a/python/ray/rllib/optimizers/async_replay_optimizer.py +++ b/python/ray/rllib/optimizers/async_replay_optimizer.py @@ -6,6 +6,7 @@ from __future__ import division from __future__ import print_function +import collections import os import random import time @@ -15,9 +16,11 @@ from six.moves import queue import ray +from ray.rllib.evaluation.sample_batch import SampleBatch, DEFAULT_POLICY_ID, \ + MultiAgentBatch from ray.rllib.optimizers.policy_optimizer import PolicyOptimizer from ray.rllib.optimizers.replay_buffer import PrioritizedReplayBuffer -from ray.rllib.evaluation.sample_batch import SampleBatch +from ray.rllib.utils.annotations import override from ray.rllib.utils.actors import TaskPool, create_colocated from ray.rllib.utils.timer import TimerStat from ray.rllib.utils.window_stat import WindowStat @@ -27,113 +30,6 @@ LEARNER_QUEUE_MAX_SIZE = 16 -@ray.remote(num_cpus=0) -class ReplayActor(object): - """A replay buffer shard. 
- - Ray actors are single-threaded, so for scalability multiple replay actors - may be created to increase parallelism.""" - - def __init__(self, num_shards, learning_starts, buffer_size, - train_batch_size, prioritized_replay_alpha, - prioritized_replay_beta, prioritized_replay_eps): - self.replay_starts = learning_starts // num_shards - self.buffer_size = buffer_size // num_shards - self.train_batch_size = train_batch_size - self.prioritized_replay_beta = prioritized_replay_beta - self.prioritized_replay_eps = prioritized_replay_eps - - self.replay_buffer = PrioritizedReplayBuffer( - self.buffer_size, alpha=prioritized_replay_alpha) - - # Metrics - self.add_batch_timer = TimerStat() - self.replay_timer = TimerStat() - self.update_priorities_timer = TimerStat() - - def get_host(self): - return os.uname()[1] - - def add_batch(self, batch): - PolicyOptimizer._check_not_multiagent(batch) - with self.add_batch_timer: - for row in batch.rows(): - self.replay_buffer.add(row["obs"], row["actions"], - row["rewards"], row["new_obs"], - row["dones"], row["weights"]) - - def replay(self): - with self.replay_timer: - if len(self.replay_buffer) < self.replay_starts: - return None - - (obses_t, actions, rewards, obses_tp1, dones, weights, - batch_indexes) = self.replay_buffer.sample( - self.train_batch_size, beta=self.prioritized_replay_beta) - - batch = SampleBatch({ - "obs": obses_t, - "actions": actions, - "rewards": rewards, - "new_obs": obses_tp1, - "dones": dones, - "weights": weights, - "batch_indexes": batch_indexes - }) - return batch - - def update_priorities(self, batch_indexes, td_errors): - with self.update_priorities_timer: - new_priorities = (np.abs(td_errors) + self.prioritized_replay_eps) - self.replay_buffer.update_priorities(batch_indexes, new_priorities) - - def stats(self): - stat = { - "add_batch_time_ms": round(1000 * self.add_batch_timer.mean, 3), - "replay_time_ms": round(1000 * self.replay_timer.mean, 3), - "update_priorities_time_ms": round( - 1000 * self.update_priorities_timer.mean, 3), - } - stat.update(self.replay_buffer.stats()) - return stat - - -class LearnerThread(threading.Thread): - """Background thread that updates the local model from replay data. - - The learner thread communicates with the main thread through Queues. This - is needed since Ray operations can only be run on the main thread. In - addition, moving heavyweight gradient ops session runs off the main thread - improves overall throughput. - """ - - def __init__(self, local_evaluator): - threading.Thread.__init__(self) - self.learner_queue_size = WindowStat("size", 50) - self.local_evaluator = local_evaluator - self.inqueue = queue.Queue(maxsize=LEARNER_QUEUE_MAX_SIZE) - self.outqueue = queue.Queue() - self.queue_timer = TimerStat() - self.grad_timer = TimerStat() - self.daemon = True - self.weights_updated = False - - def run(self): - while True: - self.step() - - def step(self): - with self.queue_timer: - ra, replay = self.inqueue.get() - if replay is not None: - with self.grad_timer: - td_error = self.local_evaluator.compute_apply(replay)[ - "td_error"] - self.outqueue.put((ra, replay, td_error, replay.count)) - self.learner_queue_size.push(self.inqueue.qsize()) - self.weights_updated = True - - class AsyncReplayOptimizer(PolicyOptimizer): """Main event loop of the Ape-X optimizer (async sampling with replay). @@ -144,6 +40,7 @@ class AsyncReplayOptimizer(PolicyOptimizer): "td_error" array in the info return of compute_gradients(). 
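Concretely, the learner-to-replay handoff in the new code below is keyed by policy id: LearnerThread.step() emits a prio_dict of the form {policy_id: (batch_indexes, td_errors)}, and ReplayActor.update_priorities() turns the TD errors into new priorities for that policy's buffer. A small numpy sketch of just that conversion, with a placeholder policy id and made-up values:

    import numpy as np

    prioritized_replay_eps = 1e-6
    # Shape of what LearnerThread.step() puts on the outqueue (values made up).
    prio_dict = {
        "my_policy": (np.array([3, 7, 11]),         # batch_indexes
                      np.array([0.5, -2.0, 0.1])),  # td_errors
    }

    for policy_id, (batch_indexes, td_errors) in prio_dict.items():
        new_priorities = np.abs(td_errors) + prioritized_replay_eps
        # The real replay shard then calls:
        #   self.replay_buffers[policy_id].update_priorities(
        #       batch_indexes, new_priorities)
        print(policy_id, batch_indexes, new_priorities)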
This error term will be used for sample prioritization.""" + @override(PolicyOptimizer) def _init(self, learning_starts=1000, buffer_size=10000, @@ -180,11 +77,12 @@ def _init(self, self.timers = { k: TimerStat() for k in [ - "put_weights", "get_samples", "enqueue", "sample_processing", + "put_weights", "get_samples", "sample_processing", "replay_processing", "update_priorities", "train", "sample" ] } self.num_weight_syncs = 0 + self.num_samples_dropped = 0 self.learning_started = False # Number of worker steps since the last weight update @@ -199,18 +97,9 @@ def _init(self, # Kick off async background sampling self.sample_tasks = TaskPool() if self.remote_evaluators: - self.set_evaluators(self.remote_evaluators) - - # For https://github.com/ray-project/ray/issues/2541 only - def set_evaluators(self, remote_evaluators): - self.remote_evaluators = remote_evaluators - weights = self.local_evaluator.get_weights() - for ev in self.remote_evaluators: - ev.set_weights.remote(weights) - self.steps_since_update[ev] = 0 - for _ in range(SAMPLE_QUEUE_DEPTH): - self.sample_tasks.add(ev, ev.sample_with_count.remote()) + self._set_evaluators(self.remote_evaluators) + @override(PolicyOptimizer) def step(self): assert len(self.remote_evaluators) > 0 start = time.time() @@ -226,6 +115,53 @@ def step(self): self.num_steps_sampled += sample_timesteps self.num_steps_trained += train_timesteps + @override(PolicyOptimizer) + def stop(self): + for r in self.replay_actors: + r.__ray_terminate__.remote() + self.learner.stopped = True + + @override(PolicyOptimizer) + def stats(self): + replay_stats = ray.get(self.replay_actors[0].stats.remote(self.debug)) + timing = { + "{}_time_ms".format(k): round(1000 * self.timers[k].mean, 3) + for k in self.timers + } + timing["learner_grad_time_ms"] = round( + 1000 * self.learner.grad_timer.mean, 3) + timing["learner_dequeue_time_ms"] = round( + 1000 * self.learner.queue_timer.mean, 3) + stats = { + "sample_throughput": round(self.timers["sample"].mean_throughput, + 3), + "train_throughput": round(self.timers["train"].mean_throughput, 3), + "num_weight_syncs": self.num_weight_syncs, + "num_samples_dropped": self.num_samples_dropped, + "learner_queue": self.learner.learner_queue_size.stats(), + "replay_shard_0": replay_stats, + } + debug_stats = { + "timing_breakdown": timing, + "pending_sample_tasks": self.sample_tasks.count, + "pending_replay_tasks": self.replay_tasks.count, + } + if self.debug: + stats.update(debug_stats) + if self.learner.stats: + stats["learner"] = self.learner.stats + return dict(PolicyOptimizer.stats(self), **stats) + + # For https://github.com/ray-project/ray/issues/2541 only + def _set_evaluators(self, remote_evaluators): + self.remote_evaluators = remote_evaluators + weights = self.local_evaluator.get_weights() + for ev in self.remote_evaluators: + ev.set_weights.remote(weights) + self.steps_since_update[ev] = 0 + for _ in range(SAMPLE_QUEUE_DEPTH): + self.sample_tasks.add(ev, ev.sample_with_count.remote()) + def _step(self): sample_timesteps, train_timesteps = 0, 0 weights = None @@ -260,42 +196,148 @@ def _step(self): with self.timers["replay_processing"]: for ra, replay in self.replay_tasks.completed(): self.replay_tasks.add(ra, ra.replay.remote()) - with self.timers["get_samples"]: - samples = ray.get(replay) - with self.timers["enqueue"]: - self.learner.inqueue.put((ra, samples)) + if self.learner.inqueue.full(): + self.num_samples_dropped += 1 + else: + with self.timers["get_samples"]: + samples = ray.get(replay) + # Defensive copy against 
plasma crashes, see #2610 #3452 + self.learner.inqueue.put((ra, samples and samples.copy())) with self.timers["update_priorities"]: while not self.learner.outqueue.empty(): - ra, replay, td_error, count = self.learner.outqueue.get() - ra.update_priorities.remote(replay["batch_indexes"], td_error) + ra, prio_dict, count = self.learner.outqueue.get() + ra.update_priorities.remote(prio_dict) train_timesteps += count return sample_timesteps, train_timesteps - def stats(self): - replay_stats = ray.get(self.replay_actors[0].stats.remote()) - timing = { - "{}_time_ms".format(k): round(1000 * self.timers[k].mean, 3) - for k in self.timers - } - timing["learner_grad_time_ms"] = round( - 1000 * self.learner.grad_timer.mean, 3) - timing["learner_dequeue_time_ms"] = round( - 1000 * self.learner.queue_timer.mean, 3) - stats = { - "sample_throughput": round(self.timers["sample"].mean_throughput, - 3), - "train_throughput": round(self.timers["train"].mean_throughput, 3), - "num_weight_syncs": self.num_weight_syncs, - } - debug_stats = { - "replay_shard_0": replay_stats, - "timing_breakdown": timing, - "pending_sample_tasks": self.sample_tasks.count, - "pending_replay_tasks": self.replay_tasks.count, - "learner_queue": self.learner.learner_queue_size.stats(), + +@ray.remote(num_cpus=0) +class ReplayActor(object): + """A replay buffer shard. + + Ray actors are single-threaded, so for scalability multiple replay actors + may be created to increase parallelism.""" + + def __init__(self, num_shards, learning_starts, buffer_size, + train_batch_size, prioritized_replay_alpha, + prioritized_replay_beta, prioritized_replay_eps): + self.replay_starts = learning_starts // num_shards + self.buffer_size = buffer_size // num_shards + self.train_batch_size = train_batch_size + self.prioritized_replay_beta = prioritized_replay_beta + self.prioritized_replay_eps = prioritized_replay_eps + + def new_buffer(): + return PrioritizedReplayBuffer( + self.buffer_size, alpha=prioritized_replay_alpha) + + self.replay_buffers = collections.defaultdict(new_buffer) + + # Metrics + self.add_batch_timer = TimerStat() + self.replay_timer = TimerStat() + self.update_priorities_timer = TimerStat() + self.num_added = 0 + + def get_host(self): + return os.uname()[1] + + def add_batch(self, batch): + # Handle everything as if multiagent + if isinstance(batch, SampleBatch): + batch = MultiAgentBatch({DEFAULT_POLICY_ID: batch}, batch.count) + with self.add_batch_timer: + for policy_id, s in batch.policy_batches.items(): + for row in s.rows(): + self.replay_buffers[policy_id].add( + row["obs"], row["actions"], row["rewards"], + row["new_obs"], row["dones"], row["weights"]) + self.num_added += batch.count + + def replay(self): + if self.num_added < self.replay_starts: + return None + + with self.replay_timer: + samples = {} + for policy_id, replay_buffer in self.replay_buffers.items(): + (obses_t, actions, rewards, obses_tp1, dones, weights, + batch_indexes) = replay_buffer.sample( + self.train_batch_size, beta=self.prioritized_replay_beta) + samples[policy_id] = SampleBatch({ + "obs": obses_t, + "actions": actions, + "rewards": rewards, + "new_obs": obses_tp1, + "dones": dones, + "weights": weights, + "batch_indexes": batch_indexes + }) + return MultiAgentBatch(samples, self.train_batch_size) + + def update_priorities(self, prio_dict): + with self.update_priorities_timer: + for policy_id, (batch_indexes, td_errors) in prio_dict.items(): + new_priorities = ( + np.abs(td_errors) + self.prioritized_replay_eps) + 
self.replay_buffers[policy_id].update_priorities( + batch_indexes, new_priorities) + + def stats(self, debug=False): + stat = { + "add_batch_time_ms": round(1000 * self.add_batch_timer.mean, 3), + "replay_time_ms": round(1000 * self.replay_timer.mean, 3), + "update_priorities_time_ms": round( + 1000 * self.update_priorities_timer.mean, 3), } - if self.debug: - stats.update(debug_stats) - return dict(PolicyOptimizer.stats(self), **stats) + for policy_id, replay_buffer in self.replay_buffers.items(): + stat.update({ + "policy_{}".format(policy_id): replay_buffer.stats(debug=debug) + }) + return stat + + +class LearnerThread(threading.Thread): + """Background thread that updates the local model from replay data. + + The learner thread communicates with the main thread through Queues. This + is needed since Ray operations can only be run on the main thread. In + addition, moving heavyweight gradient ops session runs off the main thread + improves overall throughput. + """ + + def __init__(self, local_evaluator): + threading.Thread.__init__(self) + self.learner_queue_size = WindowStat("size", 50) + self.local_evaluator = local_evaluator + self.inqueue = queue.Queue(maxsize=LEARNER_QUEUE_MAX_SIZE) + self.outqueue = queue.Queue() + self.queue_timer = TimerStat() + self.grad_timer = TimerStat() + self.daemon = True + self.weights_updated = False + self.stopped = False + self.stats = {} + + def run(self): + while not self.stopped: + self.step() + + def step(self): + with self.queue_timer: + ra, replay = self.inqueue.get() + if replay is not None: + prio_dict = {} + with self.grad_timer: + grad_out = self.local_evaluator.compute_apply(replay) + for pid, info in grad_out.items(): + prio_dict[pid] = ( + replay.policy_batches[pid]["batch_indexes"], + info["td_error"]) + if "stats" in info: + self.stats[pid] = info["stats"] + self.outqueue.put((ra, prio_dict, replay.count)) + self.learner_queue_size.push(self.inqueue.qsize()) + self.weights_updated = True diff --git a/python/ray/rllib/optimizers/async_samples_optimizer.py b/python/ray/rllib/optimizers/async_samples_optimizer.py index 3b6bb861b4824..ad0d86dfc2c36 100644 --- a/python/ray/rllib/optimizers/async_samples_optimizer.py +++ b/python/ray/rllib/optimizers/async_samples_optimizer.py @@ -6,58 +6,26 @@ from __future__ import division from __future__ import print_function +import logging +import numpy as np +import random import time import threading from six.moves import queue import ray +from ray.rllib.optimizers.multi_gpu_impl import LocalSyncParallelOptimizer from ray.rllib.optimizers.policy_optimizer import PolicyOptimizer from ray.rllib.utils.actors import TaskPool +from ray.rllib.utils.annotations import override from ray.rllib.utils.timer import TimerStat from ray.rllib.utils.window_stat import WindowStat -SAMPLE_QUEUE_DEPTH = 2 -LEARNER_QUEUE_MAX_SIZE = 16 - - -class LearnerThread(threading.Thread): - """Background thread that updates the local model from sample trajectories. - - The learner thread communicates with the main thread through Queues. This - is needed since Ray operations can only be run on the main thread. In - addition, moving heavyweight gradient ops session runs off the main thread - improves overall throughput. 
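Both learner threads in this patch follow the same shape: a daemon thread fed through a bounded inqueue, reporting processed timestep counts on an outqueue, so that all Ray calls stay on the main thread. A stripped-down sketch with a stand-in for compute_apply(), independent of RLlib:

    import threading
    from six.moves import queue

    class ToyLearner(threading.Thread):
        def __init__(self):
            threading.Thread.__init__(self)
            self.inqueue = queue.Queue(maxsize=16)
            self.outqueue = queue.Queue()
            self.daemon = True
            self.stopped = False

        def run(self):
            while not self.stopped:
                batch = self.inqueue.get()     # blocks until the driver enqueues
                count = len(batch)             # stand-in for compute_apply(batch)
                self.outqueue.put(count)

    learner = ToyLearner()
    learner.start()
    learner.inqueue.put([0.1, 0.2, 0.3])
    print(learner.outqueue.get())              # -> 3
    learner.stopped = True                     # same idea as optimizer.stop()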
- """ +logger = logging.getLogger(__name__) - def __init__(self, local_evaluator): - threading.Thread.__init__(self) - self.learner_queue_size = WindowStat("size", 50) - self.local_evaluator = local_evaluator - self.inqueue = queue.Queue(maxsize=LEARNER_QUEUE_MAX_SIZE) - self.outqueue = queue.Queue() - self.queue_timer = TimerStat() - self.grad_timer = TimerStat() - self.daemon = True - self.weights_updated = 0 - self.stats = {} - - def run(self): - while True: - self.step() - - def step(self): - with self.queue_timer: - ra, batch = self.inqueue.get() - - if batch is not None: - with self.grad_timer: - fetches = self.local_evaluator.compute_apply(batch) - self.weights_updated += 1 - if "stats" in fetches: - self.stats = fetches["stats"] - self.outqueue.put(batch.count) - self.learner_queue_size.push(self.inqueue.qsize()) +LEARNER_QUEUE_MAX_SIZE = 16 +NUM_DATA_LOAD_THREADS = 16 class AsyncSamplesOptimizer(PolicyOptimizer): @@ -67,24 +35,49 @@ class AsyncSamplesOptimizer(PolicyOptimizer): and remote evaluators (IMPALA actors). """ - def _init(self, train_batch_size=512, sample_batch_size=50, debug=False): - - self.debug = debug + @override(PolicyOptimizer) + def _init(self, + train_batch_size=500, + sample_batch_size=50, + num_envs_per_worker=1, + num_gpus=0, + lr=0.0005, + grad_clip=40, + replay_buffer_num_slots=0, + replay_proportion=0.0, + num_parallel_data_loaders=1, + max_sample_requests_in_flight_per_worker=2, + broadcast_interval=1): self.learning_started = False self.train_batch_size = train_batch_size + self.sample_batch_size = sample_batch_size + self.broadcast_interval = broadcast_interval - self.learner = LearnerThread(self.local_evaluator) + if num_gpus > 1 or num_parallel_data_loaders > 1: + logger.info( + "Enabling multi-GPU mode, {} GPUs, {} parallel loaders".format( + num_gpus, num_parallel_data_loaders)) + if train_batch_size // max(1, num_gpus) % ( + sample_batch_size // num_envs_per_worker) != 0: + raise ValueError( + "Sample batches must evenly divide across GPUs.") + self.learner = TFMultiGPULearner( + self.local_evaluator, + lr=lr, + num_gpus=num_gpus, + train_batch_size=train_batch_size, + grad_clip=grad_clip, + num_parallel_data_loaders=num_parallel_data_loaders) + else: + self.learner = LearnerThread(self.local_evaluator) self.learner.start() assert len(self.remote_evaluators) > 0 # Stats - self.timers = { - k: TimerStat() - for k in - ["put_weights", "enqueue", "sample_processing", "train", "sample"] - } + self.timers = {k: TimerStat() for k in ["train", "sample"]} self.num_weight_syncs = 0 + self.num_replayed = 0 self.learning_started = False # Kick off async background sampling @@ -92,11 +85,20 @@ def _init(self, train_batch_size=512, sample_batch_size=50, debug=False): weights = self.local_evaluator.get_weights() for ev in self.remote_evaluators: ev.set_weights.remote(weights) - for _ in range(SAMPLE_QUEUE_DEPTH): + for _ in range(max_sample_requests_in_flight_per_worker): self.sample_tasks.add(ev, ev.sample.remote()) self.batch_buffer = [] + if replay_proportion: + assert replay_buffer_num_slots > 0 + assert (replay_buffer_num_slots * sample_batch_size > + train_batch_size) + self.replay_proportion = replay_proportion + self.replay_buffer_num_slots = replay_buffer_num_slots + self.replay_batches = [] + + @override(PolicyOptimizer) def step(self): assert self.learner.is_alive() start = time.time() @@ -112,41 +114,11 @@ def step(self): self.num_steps_sampled += sample_timesteps self.num_steps_trained += train_timesteps - def _step(self): - sample_timesteps, 
train_timesteps = 0, 0 - weights = None - - with self.timers["sample_processing"]: - for ev, sample_batch in self.sample_tasks.completed_prefetch(): - sample_batch = ray.get(sample_batch) - sample_timesteps += sample_batch.count - self.batch_buffer.append(sample_batch) - if sum(b.count - for b in self.batch_buffer) >= self.train_batch_size: - train_batch = self.batch_buffer[0].concat_samples( - self.batch_buffer) - with self.timers["enqueue"]: - self.learner.inqueue.put((ev, train_batch)) - self.batch_buffer = [] - - # Note that it's important to pull new weights once - # updated to avoid excessive correlation between actors - if weights is None or self.learner.weights_updated: - self.learner.weights_updated = False - with self.timers["put_weights"]: - weights = ray.put(self.local_evaluator.get_weights()) - ev.set_weights.remote(weights) - self.num_weight_syncs += 1 - - # Kick off another sample request - self.sample_tasks.add(ev, ev.sample.remote()) - - while not self.learner.outqueue.empty(): - count = self.learner.outqueue.get() - train_timesteps += count - - return sample_timesteps, train_timesteps + @override(PolicyOptimizer) + def stop(self): + self.learner.stopped = True + @override(PolicyOptimizer) def stats(self): timing = { "{}_time_ms".format(k): round(1000 * self.timers[k].mean, 3) @@ -154,6 +126,10 @@ def stats(self): } timing["learner_grad_time_ms"] = round( 1000 * self.learner.grad_timer.mean, 3) + timing["learner_load_time_ms"] = round( + 1000 * self.learner.load_timer.mean, 3) + timing["learner_load_wait_time_ms"] = round( + 1000 * self.learner.load_wait_timer.mean, 3) timing["learner_dequeue_time_ms"] = round( 1000 * self.learner.queue_timer.mean, 3) stats = { @@ -161,14 +137,229 @@ def stats(self): 3), "train_throughput": round(self.timers["train"].mean_throughput, 3), "num_weight_syncs": self.num_weight_syncs, - } - debug_stats = { + "num_steps_replayed": self.num_replayed, "timing_breakdown": timing, - "pending_sample_tasks": self.sample_tasks.count, "learner_queue": self.learner.learner_queue_size.stats(), } - if self.debug: - stats.update(debug_stats) if self.learner.stats: stats["learner"] = self.learner.stats return dict(PolicyOptimizer.stats(self), **stats) + + def _step(self): + sample_timesteps, train_timesteps = 0, 0 + num_sent = 0 + weights = None + + for ev, sample_batch in self._augment_with_replay( + self.sample_tasks.completed_prefetch()): + self.batch_buffer.append(sample_batch) + if sum(b.count + for b in self.batch_buffer) >= self.train_batch_size: + train_batch = self.batch_buffer[0].concat_samples( + self.batch_buffer) + self.learner.inqueue.put(train_batch) + self.batch_buffer = [] + + # If the batch was replayed, skip the update below. 
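The replay mixing done by _augment_with_replay() further below interprets replay_proportion as the expected number of replayed batches emitted per fresh sample batch (0.5 gives roughly one replay every other batch, 2.0 gives two per batch). A sketch of just that sampling rule, with a made-up buffer of already-collected batches:

    import random

    replay_proportion = 1.5
    replay_batches = ["old_batch_a", "old_batch_b", "old_batch_c"]  # made up

    def replays_for_one_fresh_batch():
        emitted = []
        f = replay_proportion
        while random.random() < f:
            f -= 1
            emitted.append(random.choice(replay_batches))
        return emitted

    # Averages out to ~1.5 replayed batches per fresh batch over many calls.
    print(replays_for_one_fresh_batch())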
+ if ev is None: + continue + + sample_timesteps += sample_batch.count + + # Put in replay buffer if enabled + if self.replay_buffer_num_slots > 0: + self.replay_batches.append(sample_batch) + if len(self.replay_batches) > self.replay_buffer_num_slots: + self.replay_batches.pop(0) + + # Note that it's important to pull new weights once + # updated to avoid excessive correlation between actors + if weights is None or (self.learner.weights_updated + and num_sent >= self.broadcast_interval): + self.learner.weights_updated = False + weights = ray.put(self.local_evaluator.get_weights()) + num_sent = 0 + ev.set_weights.remote(weights) + self.num_weight_syncs += 1 + num_sent += 1 + + # Kick off another sample request + self.sample_tasks.add(ev, ev.sample.remote()) + + while not self.learner.outqueue.empty(): + count = self.learner.outqueue.get() + train_timesteps += count + + return sample_timesteps, train_timesteps + + def _augment_with_replay(self, sample_futures): + def can_replay(): + num_needed = int( + np.ceil(self.train_batch_size / self.sample_batch_size)) + return len(self.replay_batches) > num_needed + + for ev, sample_batch in sample_futures: + sample_batch = ray.get(sample_batch) + yield ev, sample_batch + + if can_replay(): + f = self.replay_proportion + while random.random() < f: + f -= 1 + replay_batch = random.choice(self.replay_batches) + self.num_replayed += replay_batch.count + yield None, replay_batch + + +class LearnerThread(threading.Thread): + """Background thread that updates the local model from sample trajectories. + + The learner thread communicates with the main thread through Queues. This + is needed since Ray operations can only be run on the main thread. In + addition, moving heavyweight gradient ops session runs off the main thread + improves overall throughput. + """ + + def __init__(self, local_evaluator): + threading.Thread.__init__(self) + self.learner_queue_size = WindowStat("size", 50) + self.local_evaluator = local_evaluator + self.inqueue = queue.Queue(maxsize=LEARNER_QUEUE_MAX_SIZE) + self.outqueue = queue.Queue() + self.queue_timer = TimerStat() + self.grad_timer = TimerStat() + self.load_timer = TimerStat() + self.load_wait_timer = TimerStat() + self.daemon = True + self.weights_updated = False + self.stats = {} + self.stopped = False + + def run(self): + while not self.stopped: + self.step() + + def step(self): + with self.queue_timer: + batch = self.inqueue.get() + + with self.grad_timer: + fetches = self.local_evaluator.compute_apply(batch) + self.weights_updated = True + self.stats = fetches.get("stats", {}) + + self.outqueue.put(batch.count) + self.learner_queue_size.push(self.inqueue.qsize()) + + +class TFMultiGPULearner(LearnerThread): + """Learner that can use multiple GPUs and parallel loading.""" + + def __init__(self, + local_evaluator, + num_gpus=1, + lr=0.0005, + train_batch_size=500, + grad_clip=40, + num_parallel_data_loaders=1): + # Multi-GPU requires TensorFlow to function. 
+ import tensorflow as tf + + LearnerThread.__init__(self, local_evaluator) + self.lr = lr + self.train_batch_size = train_batch_size + if not num_gpus: + self.devices = ["/cpu:0"] + else: + self.devices = ["/gpu:{}".format(i) for i in range(num_gpus)] + logger.info("TFMultiGPULearner devices {}".format(self.devices)) + assert self.train_batch_size % len(self.devices) == 0 + assert self.train_batch_size >= len(self.devices), "batch too small" + self.policy = self.local_evaluator.policy_map["default"] + + # per-GPU graph copies created below must share vars with the policy + # reuse is set to AUTO_REUSE because Adam nodes are created after + # all of the device copies are created. + self.par_opt = [] + with self.local_evaluator.tf_sess.graph.as_default(): + with self.local_evaluator.tf_sess.as_default(): + with tf.variable_scope("default", reuse=tf.AUTO_REUSE): + if self.policy._state_inputs: + rnn_inputs = self.policy._state_inputs + [ + self.policy._seq_lens + ] + else: + rnn_inputs = [] + adam = tf.train.AdamOptimizer(self.lr) + for _ in range(num_parallel_data_loaders): + self.par_opt.append( + LocalSyncParallelOptimizer( + adam, + self.devices, + [v for _, v in self.policy._loss_inputs], + rnn_inputs, + 999999, # it will get rounded down + self.policy.copy, + grad_norm_clipping=grad_clip)) + + self.sess = self.local_evaluator.tf_sess + self.sess.run(tf.global_variables_initializer()) + + self.idle_optimizers = queue.Queue() + self.ready_optimizers = queue.Queue() + for opt in self.par_opt: + self.idle_optimizers.put(opt) + for i in range(NUM_DATA_LOAD_THREADS): + self.loader_thread = _LoaderThread(self, share_stats=(i == 0)) + self.loader_thread.start() + + @override(LearnerThread) + def step(self): + assert self.loader_thread.is_alive() + with self.load_wait_timer: + opt = self.ready_optimizers.get() + + with self.grad_timer: + fetches = opt.optimize(self.sess, 0) + self.weights_updated = True + self.stats = fetches.get("stats", {}) + + self.idle_optimizers.put(opt) + self.outqueue.put(self.train_batch_size) + self.learner_queue_size.push(self.inqueue.qsize()) + + +class _LoaderThread(threading.Thread): + def __init__(self, learner, share_stats): + threading.Thread.__init__(self) + self.learner = learner + self.daemon = True + if share_stats: + self.queue_timer = learner.queue_timer + self.load_timer = learner.load_timer + else: + self.queue_timer = TimerStat() + self.load_timer = TimerStat() + + def run(self): + while True: + self._step() + + def _step(self): + s = self.learner + with self.queue_timer: + batch = s.inqueue.get() + + opt = s.idle_optimizers.get() + + with self.load_timer: + tuples = s.policy._get_loss_inputs_dict(batch) + data_keys = [ph for _, ph in s.policy._loss_inputs] + if s.policy._state_inputs: + state_keys = s.policy._state_inputs + [s.policy._seq_lens] + else: + state_keys = [] + opt.load_data(s.sess, [tuples[k] for k in data_keys], + [tuples[k] for k in state_keys]) + + s.ready_optimizers.put(opt) diff --git a/python/ray/rllib/optimizers/multi_gpu_impl.py b/python/ray/rllib/optimizers/multi_gpu_impl.py index 7233e37e93802..c548b20cc022d 100644 --- a/python/ray/rllib/optimizers/multi_gpu_impl.py +++ b/python/ray/rllib/optimizers/multi_gpu_impl.py @@ -3,12 +3,15 @@ from __future__ import print_function from collections import namedtuple +import logging import tensorflow as tf # Variable scope in which created variables will be placed under TOWER_SCOPE_NAME = "tower" +logger = logging.getLogger(__name__) + class LocalSyncParallelOptimizer(object): """Optimizer 
that runs in parallel across multiple local devices. @@ -36,13 +39,13 @@ class LocalSyncParallelOptimizer(object): to define the per-device loss ops. rnn_inputs: Extra input placeholders for RNN inputs. These will have shape [BATCH_SIZE // MAX_SEQ_LEN, ...]. - per_device_batch_size: Number of tuples to optimize over at a time per - device. In each call to `optimize()`, + max_per_device_batch_size: Number of tuples to optimize over at a time + per device. In each call to `optimize()`, `len(devices) * per_device_batch_size` tuples of data will be - processed. + processed. If this is larger than the total data size, it will be + clipped. build_graph: Function that takes the specified inputs and returns a TF Policy Graph instance. - logdir: Directory to place debugging output in. grad_norm_clipping: None or int stdev to clip grad norms by """ @@ -51,26 +54,29 @@ def __init__(self, devices, input_placeholders, rnn_inputs, - per_device_batch_size, + max_per_device_batch_size, build_graph, - logdir, grad_norm_clipping=None): - # TODO(rliaw): remove logdir self.optimizer = optimizer self.devices = devices - self.batch_size = per_device_batch_size * len(devices) - self.per_device_batch_size = per_device_batch_size + self.max_per_device_batch_size = max_per_device_batch_size self.loss_inputs = input_placeholders + rnn_inputs self.build_graph = build_graph - self.logdir = logdir # First initialize the shared loss network with tf.name_scope(TOWER_SCOPE_NAME): self._shared_loss = build_graph(self.loss_inputs) + shared_ops = tf.get_collection( + tf.GraphKeys.UPDATE_OPS, scope=tf.get_variable_scope().name) # Then setup the per-device loss graphs that use the shared weights self._batch_index = tf.placeholder(tf.int32, name="batch_index") + # Dynamic batch size, which may be shrunk if there isn't enough data + self._per_device_batch_size = tf.placeholder( + tf.int32, name="per_device_batch_size") + self._loaded_per_device_batch_size = max_per_device_batch_size + # When loading RNN input, we dynamically determine the max seq len self._max_seq_len = tf.placeholder(tf.int32, name="max_seq_len") self._loaded_max_seq_len = 1 @@ -88,10 +94,26 @@ def __init__(self, avg = average_gradients([t.grads for t in self._towers]) if grad_norm_clipping: + clipped = [] + for grad, _ in avg: + clipped.append(grad) + clipped, _ = tf.clip_by_global_norm(clipped, grad_norm_clipping) for i, (grad, var) in enumerate(avg): - if grad is not None: - avg[i] = (tf.clip_by_norm(grad, grad_norm_clipping), var) - self._train_op = self.optimizer.apply_gradients(avg) + avg[i] = (clipped[i], var) + + # gather update ops for any batch norm layers. TODO(ekl) here we will + # use all the ops found which won't work for DQN / DDPG, but those + # aren't supported with multi-gpu right now anyways. + self._update_ops = tf.get_collection( + tf.GraphKeys.UPDATE_OPS, scope=tf.get_variable_scope().name) + for op in shared_ops: + self._update_ops.remove(op) # only care about tower update ops + if self._update_ops: + logger.debug("Update ops to run on apply gradient: {}".format( + self._update_ops)) + + with tf.control_dependencies(self._update_ops): + self._train_op = self.optimizer.apply_gradients(avg) def load_data(self, sess, inputs, state_inputs): """Bulk loads the specified inputs into device memory. 
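load_data() below first works out how many whole sequences fit per device and then truncates the arrays so they divide evenly across devices, using the updated make_divisible_by() helper (which now accepts plain ints as well as arrays). A quick sketch of that truncation, assuming only numpy; the helper body mirrors the one in multi_gpu_impl.py:

    import numpy as np

    def make_divisible_by(a, n):
        if type(a) is int:
            return a - a % n
        return a[0:a.shape[0] - a.shape[0] % n]

    num_devices = 4
    rows = np.arange(10)
    print(make_divisible_by(rows, num_devices))   # keeps only the first 8 rows
    print(make_divisible_by(10, num_devices))     # -> 8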
@@ -117,44 +139,64 @@ def load_data(self, sess, inputs, state_inputs): assert len(self.loss_inputs) == len(inputs + state_inputs), \ (self.loss_inputs, inputs, state_inputs) - # The RNN truncation case is more complicated + # Let's suppose we have the following input data, and 2 devices: + # 1 2 3 4 5 6 7 <- state inputs shape + # A A A B B B C C C D D D E E E F F F G G G <- inputs shape + # The data is truncated and split across devices as follows: + # |---| seq len = 3 + # |---------------------------------| seq batch size = 6 seqs + # |----------------| per device batch size = 9 tuples + if len(state_inputs) > 0: + smallest_array = state_inputs[0] seq_len = len(inputs[0]) // len(state_inputs[0]) self._loaded_max_seq_len = seq_len - assert len(state_inputs[0]) * seq_len == len(inputs[0]) - # Make sure the shorter state inputs arrays are evenly divisible + else: + smallest_array = inputs[0] + self._loaded_max_seq_len = 1 + + seq_batch_size = (self.max_per_device_batch_size // + self._loaded_max_seq_len * len(self.devices)) + if len(smallest_array) < seq_batch_size: + # Dynamically shrink the batch size if insufficient data + seq_batch_size = make_divisible_by( + len(smallest_array), len(self.devices)) + if seq_batch_size < len(self.devices): + raise ValueError("Must load at least 1 tuple sequence per device, " + "got only {} total.".format(len(smallest_array))) + self._loaded_per_device_batch_size = ( + seq_batch_size // len(self.devices) * self._loaded_max_seq_len) + + if len(state_inputs) > 0: + # First truncate the RNN state arrays to the seq_batch_size state_inputs = [ - make_divisible_by(arr, self.batch_size) for arr in state_inputs + make_divisible_by(arr, seq_batch_size) for arr in state_inputs ] # Then truncate the data inputs to match inputs = [arr[:len(state_inputs[0]) * seq_len] for arr in inputs] - assert len(state_inputs[0]) * seq_len == len(inputs[0]) - assert len(state_inputs[0]) % self.batch_size == 0 + assert len(state_inputs[0]) * seq_len == len(inputs[0]), \ + (len(state_inputs[0]), seq_batch_size, seq_len, len(inputs[0])) for ph, arr in zip(self.loss_inputs, inputs + state_inputs): feed_dict[ph] = arr truncated_len = len(inputs[0]) else: for ph, arr in zip(self.loss_inputs, inputs + state_inputs): - truncated_arr = make_divisible_by(arr, self.batch_size) + truncated_arr = make_divisible_by(arr, seq_batch_size) feed_dict[ph] = truncated_arr truncated_len = len(truncated_arr) sess.run([t.init_op for t in self._towers], feed_dict=feed_dict) tuples_per_device = truncated_len / len(self.devices) - assert tuples_per_device > 0, \ - "Too few tuples per batch, trying increasing the training " \ - "batch size or decreasing the sgd batch size. Tried to split up " \ - "{} rows {}-ways in batches of {} (total across devices).".format( - len(arr), len(self.devices), self.batch_size) - assert tuples_per_device % self.per_device_batch_size == 0 + assert tuples_per_device > 0, "No data loaded?" + assert tuples_per_device % self._loaded_per_device_batch_size == 0 return tuples_per_device def optimize(self, sess, batch_index): """Run a single step of SGD. Runs a SGD step over a slice of the preloaded batch with size given by - self.per_device_batch_size and offset given by the batch_index + self._loaded_per_device_batch_size and offset given by the batch_index argument. Updates shared model weights based on the averaged per-device @@ -164,13 +206,14 @@ def optimize(self, sess, batch_index): sess: TensorFlow session. batch_index: Offset into the preloaded data. 
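Callers drive optimize() by stepping batch_index through the preloaded data in strides of the per-device batch size, typically in a shuffled order; this is what LocalMultiGPUOptimizer.step() does further below. A sketch of that outer loop with made-up sizes, assuming numpy:

    import numpy as np

    tuples_per_device = 512          # as returned by load_data()
    per_device_batch_size = 128
    num_sgd_iter = 3

    num_batches = int(tuples_per_device) // int(per_device_batch_size)
    for sgd_iter in range(num_sgd_iter):
        permutation = np.random.permutation(num_batches)
        for i in range(num_batches):
            batch_index = permutation[i] * per_device_batch_size
            # par_opt.optimize(sess, batch_index) would run one SGD step here.
            print(sgd_iter, batch_index)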
This value must be between `0` and `tuples_per_device`. The amount of data to - process is always fixed to `per_device_batch_size`. + process is at most `max_per_device_batch_size`. Returns: The outputs of extra_ops evaluated over the batch. """ feed_dict = { self._batch_index: batch_index, + self._per_device_batch_size: self._loaded_per_device_batch_size, self._max_seq_len: self._loaded_max_seq_len, } for tower in self._towers: @@ -213,7 +256,7 @@ def _setup_device(self, device, device_input_placeholders, num_data_in): current_batch, ([self._batch_index // scale * granularity] + [0] * len(ph.shape[1:])), - ([self.per_device_batch_size // scale * granularity] + + ([self._per_device_batch_size // scale * granularity] + [-1] * len(ph.shape[1:]))) current_slice.set_shape(ph.shape) device_input_slices.append(current_slice) @@ -229,8 +272,10 @@ def _setup_device(self, device, device_input_placeholders, num_data_in): Tower = namedtuple("Tower", ["init_op", "grads", "loss_graph"]) -def make_divisible_by(array, n): - return array[0:array.shape[0] - array.shape[0] % n] +def make_divisible_by(a, n): + if type(a) is int: + return a - a % n + return a[0:a.shape[0] - a.shape[0] % n] def average_gradients(tower_grads): diff --git a/python/ray/rllib/optimizers/multi_gpu_optimizer.py b/python/ray/rllib/optimizers/multi_gpu_optimizer.py index e474570363937..5ca29f68c8861 100644 --- a/python/ray/rllib/optimizers/multi_gpu_optimizer.py +++ b/python/ray/rllib/optimizers/multi_gpu_optimizer.py @@ -2,16 +2,22 @@ from __future__ import division from __future__ import print_function +import logging +import math import numpy as np from collections import defaultdict -import os import tensorflow as tf import ray from ray.rllib.evaluation.tf_policy_graph import TFPolicyGraph from ray.rllib.optimizers.policy_optimizer import PolicyOptimizer from ray.rllib.optimizers.multi_gpu_impl import LocalSyncParallelOptimizer +from ray.rllib.utils.annotations import override from ray.rllib.utils.timer import TimerStat +from ray.rllib.evaluation.sample_batch import SampleBatch, DEFAULT_POLICY_ID, \ + MultiAgentBatch + +logger = logging.getLogger(__name__) class LocalMultiGPUOptimizer(PolicyOptimizer): @@ -30,6 +36,7 @@ class LocalMultiGPUOptimizer(PolicyOptimizer): may result in unexpected behavior. """ + @override(PolicyOptimizer) def _init(self, sgd_batch_size=128, num_sgd_iter=10, @@ -42,7 +49,9 @@ def _init(self, if not num_gpus: self.devices = ["/cpu:0"] else: - self.devices = ["/gpu:{}".format(i) for i in range(num_gpus)] + self.devices = [ + "/gpu:{}".format(i) for i in range(int(math.ceil(num_gpus))) + ] self.batch_size = int(sgd_batch_size / len(self.devices)) * len( self.devices) assert self.batch_size % len(self.devices) == 0 @@ -54,39 +63,40 @@ def _init(self, self.update_weights_timer = TimerStat() self.standardize_fields = standardize_fields - print("LocalMultiGPUOptimizer devices", self.devices) + logger.info("LocalMultiGPUOptimizer devices {}".format(self.devices)) - if set(self.local_evaluator.policy_map.keys()) != {"default"}: - raise ValueError( - "Multi-agent is not supported with multi-GPU. Try using the " - "simple optimizer instead.") - self.policy = self.local_evaluator.policy_map["default"] - if not isinstance(self.policy, TFPolicyGraph): - raise ValueError( - "Only TF policies are supported with multi-GPU. 
Try using the " - "simple optimizer instead.") + self.policies = self.local_evaluator.policy_map + for policy_id, policy in self.policies.items(): + if not isinstance(policy, TFPolicyGraph): + raise ValueError( + "Only TF policies are supported with multi-GPU. Try using " + "the simple optimizer instead.") # per-GPU graph copies created below must share vars with the policy # reuse is set to AUTO_REUSE because Adam nodes are created after # all of the device copies are created. + self.optimizers = {} with self.local_evaluator.tf_sess.graph.as_default(): with self.local_evaluator.tf_sess.as_default(): - with tf.variable_scope("default", reuse=tf.AUTO_REUSE): - if self.policy._state_inputs: - rnn_inputs = self.policy._state_inputs + [ - self.policy._seq_lens - ] - else: - rnn_inputs = [] - self.par_opt = LocalSyncParallelOptimizer( - self.policy.optimizer(), self.devices, - [v for _, v in self.policy.loss_inputs()], rnn_inputs, - self.per_device_batch_size, self.policy.copy, - os.getcwd()) + for policy_id, policy in self.policies.items(): + with tf.variable_scope(policy_id, reuse=tf.AUTO_REUSE): + if policy._state_inputs: + rnn_inputs = policy._state_inputs + [ + policy._seq_lens + ] + else: + rnn_inputs = [] + self.optimizers[policy_id] = ( + LocalSyncParallelOptimizer( + policy._optimizer, self.devices, + [v + for _, v in policy._loss_inputs], rnn_inputs, + self.per_device_batch_size, policy.copy)) self.sess = self.local_evaluator.tf_sess self.sess.run(tf.global_variables_initializer()) + @override(PolicyOptimizer) def step(self): with self.update_weights_timer: if self.remote_evaluators: @@ -102,48 +112,64 @@ def step(self): self.train_batch_size) else: samples = self.local_evaluator.sample() - self._check_not_multiagent(samples) - - for field in self.standardize_fields: - value = samples[field] - standardized = (value - value.mean()) / max(1e-4, value.std()) - samples[field] = standardized - - # Important: don't shuffle RNN sequence elements - if not self.policy._state_inputs: - samples.shuffle() - + # Handle everything as if multiagent + if isinstance(samples, SampleBatch): + samples = MultiAgentBatch({ + DEFAULT_POLICY_ID: samples + }, samples.count) + + for _, batch in samples.policy_batches.items(): + for field in self.standardize_fields: + value = batch[field] + standardized = (value - value.mean()) / max(1e-4, value.std()) + batch[field] = standardized + + for policy_id, policy in self.policies.items(): + # Important: don't shuffle RNN sequence elements + if (policy_id in samples.policy_batches + and not policy._state_inputs): + samples.policy_batches[policy_id].shuffle() + + num_loaded_tuples = {} with self.load_timer: - tuples = self.policy._get_loss_inputs_dict(samples) - data_keys = [ph for _, ph in self.policy.loss_inputs()] - if self.policy._state_inputs: - state_keys = ( - self.policy._state_inputs + [self.policy._seq_lens]) - else: - state_keys = [] - tuples_per_device = self.par_opt.load_data( - self.sess, [tuples[k] for k in data_keys], - [tuples[k] for k in state_keys]) - + for policy_id, batch in samples.policy_batches.items(): + policy = self.policies[policy_id] + tuples = policy._get_loss_inputs_dict(batch) + data_keys = [ph for _, ph in policy._loss_inputs] + if policy._state_inputs: + state_keys = policy._state_inputs + [policy._seq_lens] + else: + state_keys = [] + num_loaded_tuples[policy_id] = ( + self.optimizers[policy_id].load_data( + self.sess, [tuples[k] for k in data_keys], + [tuples[k] for k in state_keys])) + + fetches = {} with self.grad_timer: - 
num_batches = ( - int(tuples_per_device) // int(self.per_device_batch_size)) - print("== sgd epochs ==") - for i in range(self.num_sgd_iter): - iter_extra_fetches = defaultdict(list) - permutation = np.random.permutation(num_batches) - for batch_index in range(num_batches): - batch_fetches = self.par_opt.optimize( - self.sess, - permutation[batch_index] * self.per_device_batch_size) - for k, v in batch_fetches.items(): - iter_extra_fetches[k].append(v) - print(i, _averaged(iter_extra_fetches)) + for policy_id, tuples_per_device in num_loaded_tuples.items(): + optimizer = self.optimizers[policy_id] + num_batches = ( + int(tuples_per_device) // int(self.per_device_batch_size)) + logger.debug("== sgd epochs for {} ==".format(policy_id)) + for i in range(self.num_sgd_iter): + iter_extra_fetches = defaultdict(list) + permutation = np.random.permutation(num_batches) + for batch_index in range(num_batches): + batch_fetches = optimizer.optimize( + self.sess, permutation[batch_index] * + self.per_device_batch_size) + for k, v in batch_fetches.items(): + iter_extra_fetches[k].append(v) + logger.debug("{} {}".format(i, + _averaged(iter_extra_fetches))) + fetches[policy_id] = _averaged(iter_extra_fetches) self.num_steps_sampled += samples.count self.num_steps_trained += samples.count - return _averaged(iter_extra_fetches) + return fetches + @override(PolicyOptimizer) def stats(self): return dict( PolicyOptimizer.stats(self), **{ diff --git a/python/ray/rllib/optimizers/policy_optimizer.py b/python/ray/rllib/optimizers/policy_optimizer.py index 21fcf5f0b7a77..a0cc085eec898 100644 --- a/python/ray/rllib/optimizers/policy_optimizer.py +++ b/python/ray/rllib/optimizers/policy_optimizer.py @@ -2,10 +2,13 @@ from __future__ import division from __future__ import print_function +import logging + import ray from ray.rllib.evaluation.policy_evaluator import PolicyEvaluator from ray.rllib.evaluation.metrics import collect_episodes, summarize_episodes -from ray.rllib.evaluation.sample_batch import MultiAgentBatch + +logger = logging.getLogger(__name__) class PolicyOptimizer(object): @@ -53,10 +56,13 @@ def __init__(self, local_evaluator, remote_evaluators=None, config=None): self.num_steps_trained = 0 self.num_steps_sampled = 0 + logger.debug("Created policy optimizer with {}: {}".format( + config, self)) + def _init(self): """Subclasses should prefer overriding this instead of __init__.""" - pass + raise NotImplementedError def step(self): """Takes a logical optimization step. @@ -79,18 +85,42 @@ def stats(self): "num_steps_sampled": self.num_steps_sampled, } - def collect_metrics(self, min_history=100): + def save(self): + """Returns a serializable object representing the optimizer state.""" + + return [self.num_steps_trained, self.num_steps_sampled] + + def restore(self, data): + """Restores optimizer state from the given data object.""" + + self.num_steps_trained = data[0] + self.num_steps_sampled = data[1] + + def stop(self): + """Release any resources used by this optimizer.""" + pass + + def collect_metrics(self, + timeout_seconds, + min_history=100, + selected_evaluators=None): """Returns evaluator and optimizer stats. Arguments: + timeout_seconds (int): Max wait time for a evaluator before + dropping its results. This usually indicates a hung evaluator. min_history (int): Min history length to smooth results over. + selected_evaluators (list): Override the list of remote evaluators + to collect metrics from. 
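The smoothing that follows pads a short list of freshly collected episodes with the tail of self.episode_history until min_history is reached; the padding call itself sits in context elided by this hunk, so the extend line below is an assumption based on the surrounding bookkeeping. A self-contained sketch with toy episode markers:

    min_history = 5
    episode_history = ["e1", "e2", "e3", "e4"]   # retained from earlier calls
    episodes = ["e5", "e6"]                      # fresh this call (made up)

    orig_episodes = list(episodes)
    missing = min_history - len(episodes)
    if missing > 0:
        episodes.extend(episode_history[-missing:])   # assumed padding step
        assert len(episodes) <= min_history
    episode_history.extend(orig_episodes)
    episode_history = episode_history[-min_history:]

    print(episodes)          # ['e5', 'e6', 'e2', 'e3', 'e4']
    print(episode_history)   # ['e2', 'e3', 'e4', 'e5', 'e6']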
Returns: res (dict): A training result dict from evaluator metrics with `info` replaced with stats from self. """ - episodes = collect_episodes(self.local_evaluator, - self.remote_evaluators) + episodes, num_dropped = collect_episodes( + self.local_evaluator, + selected_evaluators or self.remote_evaluators, + timeout_seconds=timeout_seconds) orig_episodes = list(episodes) missing = min_history - len(episodes) if missing > 0: @@ -98,21 +128,10 @@ def collect_metrics(self, min_history=100): assert len(episodes) <= min_history self.episode_history.extend(orig_episodes) self.episode_history = self.episode_history[-min_history:] - res = summarize_episodes(episodes, orig_episodes) + res = summarize_episodes(episodes, orig_episodes, num_dropped) res.update(info=self.stats()) return res - def save(self): - """Returns a serializable object representing the optimizer state.""" - - return [self.num_steps_trained, self.num_steps_sampled] - - def restore(self, data): - """Restores optimizer state from the given data object.""" - - self.num_steps_trained = data[0] - self.num_steps_sampled = data[1] - def foreach_evaluator(self, func): """Apply the given function to each evaluator instance.""" @@ -134,12 +153,6 @@ def foreach_evaluator_with_index(self, func): ]) return local_result + remote_results - @staticmethod - def _check_not_multiagent(sample_batch): - if isinstance(sample_batch, MultiAgentBatch): - raise NotImplementedError( - "This optimizer does not support multi-agent yet.") - @classmethod def make(cls, env_creator, diff --git a/python/ray/rllib/optimizers/replay_buffer.py b/python/ray/rllib/optimizers/replay_buffer.py index 77d954345668f..cd5ec732848e0 100644 --- a/python/ray/rllib/optimizers/replay_buffer.py +++ b/python/ray/rllib/optimizers/replay_buffer.py @@ -93,14 +93,15 @@ def sample(self, batch_size): self._num_sampled += batch_size return self._encode_sample(idxes) - def stats(self): + def stats(self, debug=False): data = { "added_count": self._num_added, "sampled_count": self._num_sampled, "est_size_bytes": self._est_size_bytes, "num_entries": len(self._storage), } - data.update(self._evicted_hit_stats.stats()) + if debug: + data.update(self._evicted_hit_stats.stats()) return data @@ -233,7 +234,8 @@ def update_priorities(self, idxes, priorities): self._max_priority = max(self._max_priority, priority) - def stats(self): - parent = ReplayBuffer.stats(self) - parent.update(self._prio_change_stats.stats()) + def stats(self, debug=False): + parent = ReplayBuffer.stats(self, debug) + if debug: + parent.update(self._prio_change_stats.stats()) return parent diff --git a/python/ray/rllib/optimizers/sync_replay_optimizer.py b/python/ray/rllib/optimizers/sync_replay_optimizer.py index 73df006014679..f2a42a08302a5 100644 --- a/python/ray/rllib/optimizers/sync_replay_optimizer.py +++ b/python/ray/rllib/optimizers/sync_replay_optimizer.py @@ -11,6 +11,7 @@ from ray.rllib.optimizers.policy_optimizer import PolicyOptimizer from ray.rllib.evaluation.sample_batch import SampleBatch, DEFAULT_POLICY_ID, \ MultiAgentBatch +from ray.rllib.utils.annotations import override from ray.rllib.utils.compression import pack_if_needed from ray.rllib.utils.filter import RunningStat from ray.rllib.utils.timer import TimerStat @@ -24,6 +25,7 @@ class SyncReplayOptimizer(PolicyOptimizer): "td_error" array in the info return of compute_gradients(). 
This error term will be used for sample prioritization.""" + @override(PolicyOptimizer) def _init(self, learning_starts=1000, buffer_size=10000, @@ -53,6 +55,7 @@ def _init(self, self.replay_timer = TimerStat() self.grad_timer = TimerStat() self.throughput = RunningStat() + self.learner_stats = {} # Set up replay buffer if prioritized_replay: @@ -69,6 +72,7 @@ def new_buffer(): assert buffer_size >= self.replay_starts + @override(PolicyOptimizer) def step(self): with self.update_weights_timer: if self.remote_evaluators: @@ -105,12 +109,29 @@ def step(self): self.num_steps_sampled += batch.count + @override(PolicyOptimizer) + def stats(self): + return dict( + PolicyOptimizer.stats(self), **{ + "sample_time_ms": round(1000 * self.sample_timer.mean, 3), + "replay_time_ms": round(1000 * self.replay_timer.mean, 3), + "grad_time_ms": round(1000 * self.grad_timer.mean, 3), + "update_time_ms": round(1000 * self.update_weights_timer.mean, + 3), + "opt_peak_throughput": round(self.grad_timer.mean_throughput, + 3), + "opt_samples": round(self.grad_timer.mean_units_processed, 3), + "learner": self.learner_stats, + }) + def _optimize(self): samples = self._replay() with self.grad_timer: info_dict = self.local_evaluator.compute_apply(samples) for policy_id, info in info_dict.items(): + if "stats" in info: + self.learner_stats[policy_id] = info["stats"] replay_buffer = self.replay_buffers[policy_id] if isinstance(replay_buffer, PrioritizedReplayBuffer): td_error = info["td_error"] @@ -148,16 +169,3 @@ def _replay(self): "batch_indexes": batch_indexes }) return MultiAgentBatch(samples, self.train_batch_size) - - def stats(self): - return dict( - PolicyOptimizer.stats(self), **{ - "sample_time_ms": round(1000 * self.sample_timer.mean, 3), - "replay_time_ms": round(1000 * self.replay_timer.mean, 3), - "grad_time_ms": round(1000 * self.grad_timer.mean, 3), - "update_time_ms": round(1000 * self.update_weights_timer.mean, - 3), - "opt_peak_throughput": round(self.grad_timer.mean_throughput, - 3), - "opt_samples": round(self.grad_timer.mean_units_processed, 3), - }) diff --git a/python/ray/rllib/optimizers/sync_samples_optimizer.py b/python/ray/rllib/optimizers/sync_samples_optimizer.py index 20922ff54036a..b78e3ed01d70e 100644 --- a/python/ray/rllib/optimizers/sync_samples_optimizer.py +++ b/python/ray/rllib/optimizers/sync_samples_optimizer.py @@ -3,11 +3,15 @@ from __future__ import print_function import ray +import logging from ray.rllib.optimizers.policy_optimizer import PolicyOptimizer from ray.rllib.evaluation.sample_batch import SampleBatch +from ray.rllib.utils.annotations import override from ray.rllib.utils.filter import RunningStat from ray.rllib.utils.timer import TimerStat +logger = logging.getLogger(__name__) + class SyncSamplesOptimizer(PolicyOptimizer): """A simple synchronous RL optimizer. @@ -17,6 +21,7 @@ class SyncSamplesOptimizer(PolicyOptimizer): model weights are then broadcast to all remote evaluators. 
""" + @override(PolicyOptimizer) def _init(self, num_sgd_iter=1, train_batch_size=1): self.update_weights_timer = TimerStat() self.sample_timer = TimerStat() @@ -26,6 +31,7 @@ def _init(self, num_sgd_iter=1, train_batch_size=1): self.train_batch_size = train_batch_size self.learner_stats = {} + @override(PolicyOptimizer) def step(self): with self.update_weights_timer: if self.remote_evaluators: @@ -52,13 +58,14 @@ def step(self): if "stats" in fetches: self.learner_stats = fetches["stats"] if self.num_sgd_iter > 1: - print(i, fetches) + logger.debug("{} {}".format(i, fetches)) self.grad_timer.push_units_processed(samples.count) self.num_steps_sampled += samples.count self.num_steps_trained += samples.count return fetches + @override(PolicyOptimizer) def stats(self): return dict( PolicyOptimizer.stats(self), **{ diff --git a/python/ray/rllib/rollout.py b/python/ray/rllib/rollout.py index 0e33e3d6ced61..bee5c5eb2ae12 100755 --- a/python/ray/rllib/rollout.py +++ b/python/ray/rllib/rollout.py @@ -12,8 +12,6 @@ import gym import ray from ray.rllib.agents.agent import get_agent_class -from ray.rllib.agents.dqn.common.wrappers import wrap_dqn -from ray.rllib.models import ModelCatalog EXAMPLE_USAGE = """ Example Usage via RLlib CLI: @@ -54,7 +52,7 @@ def create_parser(parser_creator=None): const=True, help="Surpress rendering of the environment.") parser.add_argument( - "--steps", default=None, help="Number of steps to roll out.") + "--steps", default=10000, help="Number of steps to roll out.") parser.add_argument("--out", default=None, help="Output filename.") parser.add_argument( "--config", @@ -66,30 +64,38 @@ def create_parser(parser_creator=None): def run(args, parser): - if not args.config: + config = args.config + if not config: # Load configuration from file config_dir = os.path.dirname(args.checkpoint) config_path = os.path.join(config_dir, "params.json") + if not os.path.exists(config_path): + config_path = os.path.join(config_dir, "../params.json") + if not os.path.exists(config_path): + raise ValueError( + "Could not find params.json in either the checkpoint dir or " + "its parent directory.") with open(config_path) as f: - args.config = json.load(f) + config = json.load(f) + if "num_workers" in config: + config["num_workers"] = min(2, config["num_workers"]) if not args.env: - if not args.config.get("env"): + if not config.get("env"): parser.error("the following arguments are required: --env") - args.env = args.config.get("env") + args.env = config.get("env") ray.init() cls = get_agent_class(args.run) - agent = cls(env=args.env, config=args.config) + agent = cls(env=args.env, config=config) agent.restore(args.checkpoint) num_steps = int(args.steps) - if args.run == "DQN": - env = gym.make(args.env) - env = wrap_dqn(env, args.config.get("model", {})) + if hasattr(agent, "local_evaluator"): + env = agent.local_evaluator.env else: - env = ModelCatalog.get_preprocessor_as_wrapper(gym.make(args.env)) + env = gym.make(args.env) if args.out is not None: rollouts = [] steps = 0 diff --git a/python/ray/rllib/scripts.py b/python/ray/rllib/scripts.py index cc48b83cf3341..88d5d56292b13 100644 --- a/python/ray/rllib/scripts.py +++ b/python/ray/rllib/scripts.py @@ -14,7 +14,7 @@ rllib train --run DQN --env CartPole-v0 Example usage for rollout: - rllib rollout /tmp/ray/checkpoint_dir/checkpoint-0 --run DQN + rllib rollout /trial_dir/checkpoint_1/checkpoint-1 --run DQN """ diff --git a/python/ray/rllib/test/test_catalog.py b/python/ray/rllib/test/test_catalog.py index e3dc1e782535d..efa1aba0e2f07 
100644 --- a/python/ray/rllib/test/test_catalog.py +++ b/python/ray/rllib/test/test_catalog.py @@ -15,16 +15,18 @@ class CustomPreprocessor(Preprocessor): - pass + def _init_shape(self, obs_space, options): + return None class CustomPreprocessor2(Preprocessor): - pass + def _init_shape(self, obs_space, options): + return None class CustomModel(Model): def _build_layers(self, *args): - return None, None + return tf.constant([[0] * 5]), None class ModelCatalogTest(unittest.TestCase): @@ -69,19 +71,24 @@ def testDefaultModels(self): ray.init() with tf.variable_scope("test1"): - p1 = ModelCatalog.get_model(np.zeros((10, 3), dtype=np.float32), 5) + p1 = ModelCatalog.get_model({ + "obs": tf.zeros((10, 3), dtype=tf.float32) + }, Box(0, 1, shape=(3, ), dtype=np.float32), 5, {}) self.assertEqual(type(p1), FullyConnectedNetwork) with tf.variable_scope("test2"): - p2 = ModelCatalog.get_model( - np.zeros((10, 84, 84, 3), dtype=np.float32), 5) + p2 = ModelCatalog.get_model({ + "obs": tf.zeros((10, 84, 84, 3), dtype=tf.float32) + }, Box(0, 1, shape=(84, 84, 3), dtype=np.float32), 5, {}) self.assertEqual(type(p2), VisionNetwork) def testCustomModel(self): ray.init() ModelCatalog.register_custom_model("foo", CustomModel) - p1 = ModelCatalog.get_model( - tf.constant([1, 2, 3]), 5, {"custom_model": "foo"}) + p1 = ModelCatalog.get_model({ + "obs": tf.constant([1, 2, 3]) + }, Box(0, 1, shape=(3, ), dtype=np.float32), 5, + {"custom_model": "foo"}) self.assertEqual(str(type(p1)), str(CustomModel)) diff --git a/python/ray/rllib/test/test_checkpoint_restore.py b/python/ray/rllib/test/test_checkpoint_restore.py index cb371c90c29f8..aa8fac28086ab 100644 --- a/python/ray/rllib/test/test_checkpoint_restore.py +++ b/python/ray/rllib/test/test_checkpoint_restore.py @@ -23,7 +23,8 @@ def get_mean_action(alg, obs): "ES": { "episodes_per_batch": 10, "train_batch_size": 100, - "num_workers": 2 + "num_workers": 2, + "observation_filter": "MeanStdFilter" }, "DQN": {}, "APEX_DDPG": { @@ -46,6 +47,11 @@ def get_mean_action(alg, obs): "A3C": { "num_workers": 1 }, + "ARS": { + "num_rollouts": 10, + "num_workers": 2, + "observation_filter": "MeanStdFilter" + } } @@ -83,7 +89,7 @@ def test(use_object_store, alg_name, failures): if __name__ == "__main__": failures = [] for use_object_store in [False, True]: - for name in ["ES", "DQN", "DDPG", "PPO", "A3C", "APEX_DDPG"]: + for name in ["ES", "DQN", "DDPG", "PPO", "A3C", "APEX_DDPG", "ARS"]: test(use_object_store, name, failures) assert not failures, failures diff --git a/python/ray/rllib/test/test_env_with_subprocess.py b/python/ray/rllib/test/test_env_with_subprocess.py new file mode 100644 index 0000000000000..fc940cdea05eb --- /dev/null +++ b/python/ray/rllib/test/test_env_with_subprocess.py @@ -0,0 +1,78 @@ +"""Tests that envs clean up after themselves on agent exit.""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +from gym.spaces import Discrete +import atexit +import gym +import os +import subprocess +import tempfile +import time + +import ray +from ray.tune import run_experiments +from ray.tune.registry import register_env + +# Dummy command to run as a subprocess with a unique name +UNIQUE_CMD = "sleep {}".format(str(time.time())) +_, UNIQUE_FILE_0 = tempfile.mkstemp("test_env_with_subprocess") +_, UNIQUE_FILE_1 = tempfile.mkstemp("test_env_with_subprocess") + + +class EnvWithSubprocess(gym.Env): + """Our env that spawns a subprocess.""" + + def __init__(self, config): + self.action_space = Discrete(2) + 
self.observation_space = Discrete(2) + # Subprocess that should be cleaned up + self.subproc = subprocess.Popen(UNIQUE_CMD.split(" "), shell=False) + # Exit handler should be called + if config.worker_index == 0: + atexit.register(lambda: os.unlink(UNIQUE_FILE_0)) + else: + atexit.register(lambda: os.unlink(UNIQUE_FILE_1)) + atexit.register(lambda: self.subproc.kill()) + + def reset(self): + return 0 + + def step(self, action): + return 0, 0, True, {} + + +def leaked_processes(): + """Returns whether any subprocesses were leaked.""" + result = subprocess.check_output( + "ps aux | grep '{}' | grep -v grep || true".format(UNIQUE_CMD), + shell=True) + return result + + +if __name__ == "__main__": + register_env("subproc", lambda config: EnvWithSubprocess(config)) + ray.init() + assert os.path.exists(UNIQUE_FILE_0) + assert os.path.exists(UNIQUE_FILE_1) + assert not leaked_processes() + run_experiments({ + "demo": { + "run": "PG", + "env": "subproc", + "num_samples": 1, + "config": { + "num_workers": 1, + }, + "stop": { + "training_iteration": 1 + }, + }, + }) + leaked = leaked_processes() + assert not leaked, "LEAKED PROCESSES: {}".format(leaked) + assert not os.path.exists(UNIQUE_FILE_0), "atexit handler not called" + assert not os.path.exists(UNIQUE_FILE_1), "atexit handler not called" + print("OK") diff --git a/python/ray/rllib/test/test_evaluators.py b/python/ray/rllib/test/test_evaluators.py index 9ae0994f33466..c7a72d7a5bb87 100644 --- a/python/ray/rllib/test/test_evaluators.py +++ b/python/ray/rllib/test/test_evaluators.py @@ -4,7 +4,7 @@ import unittest -from ray.rllib.agents.dqn.dqn_policy_graph import adjust_nstep +from ray.rllib.agents.dqn.dqn_policy_graph import _adjust_nstep class DQNTest(unittest.TestCase): @@ -14,7 +14,7 @@ def testNStep(self): rewards = [10.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0] new_obs = [2, 3, 4, 5, 6, 7, 8] dones = [0, 0, 0, 0, 0, 0, 1] - adjust_nstep(3, 0.9, obs, actions, rewards, new_obs, dones) + _adjust_nstep(3, 0.9, obs, actions, rewards, new_obs, dones) self.assertEqual(obs, [1, 2, 3, 4, 5, 6, 7]) self.assertEqual(actions, ["a", "b", "a", "a", "a", "b", "a"]) self.assertEqual(new_obs, [4, 5, 6, 7, 8, 8, 8]) diff --git a/python/ray/rllib/test/test_serving_env.py b/python/ray/rllib/test/test_external_env.py similarity index 88% rename from python/ray/rllib/test/test_serving_env.py rename to python/ray/rllib/test/test_external_env.py index 6f47eeeeeedd8..f7e8308a5ff17 100644 --- a/python/ray/rllib/test/test_serving_env.py +++ b/python/ray/rllib/test/test_external_env.py @@ -12,15 +12,15 @@ from ray.rllib.agents.dqn import DQNAgent from ray.rllib.agents.pg import PGAgent from ray.rllib.evaluation.policy_evaluator import PolicyEvaluator -from ray.rllib.env.serving_env import ServingEnv +from ray.rllib.env.external_env import ExternalEnv from ray.rllib.test.test_policy_evaluator import BadPolicyGraph, \ MockPolicyGraph, MockEnv from ray.tune.registry import register_env -class SimpleServing(ServingEnv): +class SimpleServing(ExternalEnv): def __init__(self, env): - ServingEnv.__init__(self, env.action_space, env.observation_space) + ExternalEnv.__init__(self, env.action_space, env.observation_space) self.env = env def run(self): @@ -36,9 +36,9 @@ def run(self): eid = self.start_episode() -class PartOffPolicyServing(ServingEnv): +class PartOffPolicyServing(ExternalEnv): def __init__(self, env, off_pol_frac): - ServingEnv.__init__(self, env.action_space, env.observation_space) + ExternalEnv.__init__(self, env.action_space, env.observation_space) self.env = 
env self.off_pol_frac = off_pol_frac @@ -59,9 +59,9 @@ def run(self): eid = self.start_episode() -class SimpleOffPolicyServing(ServingEnv): +class SimpleOffPolicyServing(ExternalEnv): def __init__(self, env, fixed_action): - ServingEnv.__init__(self, env.action_space, env.observation_space) + ExternalEnv.__init__(self, env.action_space, env.observation_space) self.env = env self.fixed_action = fixed_action @@ -79,12 +79,12 @@ def run(self): eid = self.start_episode() -class MultiServing(ServingEnv): +class MultiServing(ExternalEnv): def __init__(self, env_creator): self.env_creator = env_creator self.env = env_creator() - ServingEnv.__init__(self, self.env.action_space, - self.env.observation_space) + ExternalEnv.__init__(self, self.env.action_space, + self.env.observation_space) def run(self): envs = [self.env_creator() for _ in range(5)] @@ -107,8 +107,8 @@ def run(self): del cur_obs[i] -class TestServingEnv(unittest.TestCase): - def testServingEnvCompleteEpisodes(self): +class TestExternalEnv(unittest.TestCase): + def testExternalEnvCompleteEpisodes(self): ev = PolicyEvaluator( env_creator=lambda _: SimpleServing(MockEnv(25)), policy_graph=MockPolicyGraph, @@ -118,7 +118,7 @@ def testServingEnvCompleteEpisodes(self): batch = ev.sample() self.assertEqual(batch.count, 50) - def testServingEnvTruncateEpisodes(self): + def testExternalEnvTruncateEpisodes(self): ev = PolicyEvaluator( env_creator=lambda _: SimpleServing(MockEnv(25)), policy_graph=MockPolicyGraph, @@ -128,7 +128,7 @@ def testServingEnvTruncateEpisodes(self): batch = ev.sample() self.assertEqual(batch.count, 40) - def testServingEnvOffPolicy(self): + def testExternalEnvOffPolicy(self): ev = PolicyEvaluator( env_creator=lambda _: SimpleOffPolicyServing(MockEnv(25), 42), policy_graph=MockPolicyGraph, @@ -140,7 +140,7 @@ def testServingEnvOffPolicy(self): self.assertEqual(batch["actions"][0], 42) self.assertEqual(batch["actions"][-1], 42) - def testServingEnvBadActions(self): + def testExternalEnvBadActions(self): ev = PolicyEvaluator( env_creator=lambda _: SimpleServing(MockEnv(25)), policy_graph=BadPolicyGraph, @@ -185,15 +185,14 @@ def testTrainCartpoleMulti(self): return raise Exception("failed to improve reward") - def testServingEnvHorizonNotSupported(self): + def testExternalEnvHorizonNotSupported(self): ev = PolicyEvaluator( env_creator=lambda _: SimpleServing(MockEnv(25)), policy_graph=MockPolicyGraph, episode_horizon=20, batch_steps=10, batch_mode="complete_episodes") - ev.sample() - self.assertRaises(Exception, lambda: ev.sample()) + self.assertRaises(ValueError, lambda: ev.sample()) if __name__ == '__main__': diff --git a/python/ray/rllib/test/test_lstm.py b/python/ray/rllib/test/test_lstm.py index 2abfb7680cd3d..abb9ad0ccb4a7 100644 --- a/python/ray/rllib/test/test_lstm.py +++ b/python/ray/rllib/test/test_lstm.py @@ -10,10 +10,12 @@ class LSTMUtilsTest(unittest.TestCase): def testBasic(self): eps_ids = [1, 1, 1, 5, 5, 5, 5, 5] + agent_ids = [1, 1, 1, 1, 1, 1, 1, 1] f = [[101, 102, 103, 201, 202, 203, 204, 205], [[101], [102], [103], [201], [202], [203], [204], [205]]] s = [[209, 208, 207, 109, 108, 107, 106, 105]] - f_pad, s_init, seq_lens = chop_into_sequences(eps_ids, f, s, 4) + f_pad, s_init, seq_lens = chop_into_sequences(eps_ids, agent_ids, f, s, + 4) self.assertEqual([f.tolist() for f in f_pad], [ [101, 102, 103, 0, 201, 202, 203, 204, 205, 0, 0, 0], [[101], [102], [103], [0], [201], [202], [203], [204], [205], [0], @@ -22,11 +24,25 @@ def testBasic(self): self.assertEqual([s.tolist() for s in s_init], [[209, 
109, 105]]) self.assertEqual(seq_lens.tolist(), [3, 4, 1]) + def testMultiAgent(self): + eps_ids = [1, 1, 1, 5, 5, 5, 5, 5] + agent_ids = [1, 1, 2, 1, 1, 2, 2, 3] + f = [[101, 102, 103, 201, 202, 203, 204, 205], + [[101], [102], [103], [201], [202], [203], [204], [205]]] + s = [[209, 208, 207, 109, 108, 107, 106, 105]] + f_pad, s_init, seq_lens = chop_into_sequences( + eps_ids, agent_ids, f, s, 4, dynamic_max=False) + self.assertEqual(seq_lens.tolist(), [2, 1, 2, 2, 1]) + self.assertEqual(len(f_pad[0]), 20) + self.assertEqual(len(s_init[0]), 5) + def testDynamicMaxLen(self): eps_ids = [5, 2, 2] + agent_ids = [2, 2, 2] f = [[1, 1, 1]] s = [[1, 1, 1]] - f_pad, s_init, seq_lens = chop_into_sequences(eps_ids, f, s, 4) + f_pad, s_init, seq_lens = chop_into_sequences(eps_ids, agent_ids, f, s, + 4) self.assertEqual([f.tolist() for f in f_pad], [[1, 0, 1, 1]]) self.assertEqual([s.tolist() for s in s_init], [[1, 1]]) self.assertEqual(seq_lens.tolist(), [1, 2]) diff --git a/python/ray/rllib/test/test_multi_agent_env.py b/python/ray/rllib/test/test_multi_agent_env.py index 96eaabaf1dff2..1fdfa5d74ae8a 100644 --- a/python/ray/rllib/test/test_multi_agent_env.py +++ b/python/ray/rllib/test/test_multi_agent_env.py @@ -15,12 +15,19 @@ from ray.rllib.test.test_policy_evaluator import MockEnv, MockEnv2, \ MockPolicyGraph from ray.rllib.evaluation.policy_evaluator import PolicyEvaluator +from ray.rllib.evaluation.policy_graph import PolicyGraph from ray.rllib.evaluation.metrics import collect_metrics from ray.rllib.env.async_vector_env import _MultiAgentEnvToAsync from ray.rllib.env.multi_agent_env import MultiAgentEnv from ray.tune.registry import register_env +def one_hot(i, n): + out = [0.0] * n + out[i] = 1.0 + return out + + class BasicMultiAgent(MultiAgentEnv): """Env of N independent agents, each of which exits after 25 steps.""" @@ -63,7 +70,7 @@ def __init__(self, num, increment_obs=False): self.last_info = {} self.i = 0 self.num = num - self.observation_space = gym.spaces.Discrete(2) + self.observation_space = gym.spaces.Discrete(10) self.action_space = gym.spaces.Discrete(2) def reset(self): @@ -99,25 +106,32 @@ def step(self, action_dict): return obs, rew, done, info -class MultiCartpole(MultiAgentEnv): - def __init__(self, num): - self.agents = [gym.make("CartPole-v0") for _ in range(num)] - self.dones = set() - self.observation_space = self.agents[0].observation_space - self.action_space = self.agents[0].action_space +def make_multiagent(env_name): + class MultiEnv(MultiAgentEnv): + def __init__(self, num): + self.agents = [gym.make(env_name) for _ in range(num)] + self.dones = set() + self.observation_space = self.agents[0].observation_space + self.action_space = self.agents[0].action_space - def reset(self): - self.dones = set() - return {i: a.reset() for i, a in enumerate(self.agents)} + def reset(self): + self.dones = set() + return {i: a.reset() for i, a in enumerate(self.agents)} - def step(self, action_dict): - obs, rew, done, info = {}, {}, {}, {} - for i, action in action_dict.items(): - obs[i], rew[i], done[i], info[i] = self.agents[i].step(action) - if done[i]: - self.dones.add(i) - done["__all__"] = len(self.dones) == len(self.agents) - return obs, rew, done, info + def step(self, action_dict): + obs, rew, done, info = {}, {}, {}, {} + for i, action in action_dict.items(): + obs[i], rew[i], done[i], info[i] = self.agents[i].step(action) + if done[i]: + self.dones.add(i) + done["__all__"] = len(self.dones) == len(self.agents) + return obs, rew, done, info + + return MultiEnv + + 
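# A brief usage sketch for the make_multiagent factory above (assumed call
# pattern, mirroring the MultiEnv reset/step logic it returns): the wrapped env
# yields per-agent dicts keyed by agent index, plus the special "__all__" done flag.
#
#   env = make_multiagent("CartPole-v0")(2)
#   obs = env.reset()                              # {0: obs_0, 1: obs_1}
#   obs, rew, done, info = env.step({0: 0, 1: 1})
#   done                                           # e.g. {0: False, 1: False, "__all__": False}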
+MultiCartpole = make_multiagent("CartPole-v0") +MultiMountainCar = make_multiagent("MountainCarContinuous-v0") class TestMultiAgentEnv(unittest.TestCase): @@ -282,7 +296,7 @@ def testMultiAgentSampleWithHorizon(self): def testMultiAgentSampleRoundRobin(self): act_space = gym.spaces.Discrete(2) - obs_space = gym.spaces.Discrete(2) + obs_space = gym.spaces.Discrete(10) ev = PolicyEvaluator( env_creator=lambda _: RoundRobinMultiAgent(5, increment_obs=True), policy_graph={ @@ -295,10 +309,20 @@ def testMultiAgentSampleRoundRobin(self): # since we round robin introduce agents into the env, some of the env # steps don't count as proper transitions self.assertEqual(batch.policy_batches["p0"].count, 42) - self.assertEqual(batch.policy_batches["p0"]["obs"].tolist()[:10], - [0, 1, 2, 3, 4] * 2) - self.assertEqual(batch.policy_batches["p0"]["new_obs"].tolist()[:10], - [1, 2, 3, 4, 5] * 2) + self.assertEqual(batch.policy_batches["p0"]["obs"].tolist()[:10], [ + one_hot(0, 10), + one_hot(1, 10), + one_hot(2, 10), + one_hot(3, 10), + one_hot(4, 10), + ] * 2) + self.assertEqual(batch.policy_batches["p0"]["new_obs"].tolist()[:10], [ + one_hot(1, 10), + one_hot(2, 10), + one_hot(3, 10), + one_hot(4, 10), + one_hot(5, 10), + ] * 2) self.assertEqual(batch.policy_batches["p0"]["rewards"].tolist()[:10], [100, 100, 100, 100, 0] * 2) self.assertEqual(batch.policy_batches["p0"]["dones"].tolist()[:10], @@ -306,12 +330,39 @@ def testMultiAgentSampleRoundRobin(self): self.assertEqual(batch.policy_batches["p0"]["t"].tolist()[:10], [4, 9, 14, 19, 24, 5, 10, 15, 20, 25]) + def testCustomRNNStateValues(self): + h = {"some": {"arbitrary": "structure", "here": [1, 2, 3]}} + + class StatefulPolicyGraph(PolicyGraph): + def compute_actions(self, + obs_batch, + state_batches, + prev_action_batch=None, + prev_reward_batch=None, + episodes=None): + return [0] * len(obs_batch), [[h] * len(obs_batch)], {} + + def get_initial_state(self): + return [{}] # empty dict + + ev = PolicyEvaluator( + env_creator=lambda _: gym.make("CartPole-v0"), + policy_graph=StatefulPolicyGraph, + batch_steps=5) + batch = ev.sample() + self.assertEqual(batch.count, 5) + self.assertEqual(batch["state_in_0"][0], {}) + self.assertEqual(batch["state_out_0"][0], h) + self.assertEqual(batch["state_in_0"][1], h) + self.assertEqual(batch["state_out_0"][1], h) + def testReturningModelBasedRolloutsData(self): class ModelBasedPolicyGraph(PGPolicyGraph): def compute_actions(self, obs_batch, state_batches, - is_training=False, + prev_action_batch=None, + prev_reward_batch=None, episodes=None): # Pretend we did a model-based rollout and want to return # the extra trajectory. 
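# A hedged sketch of the extra-batch pattern this test exercises; only the two
# calls visible in the surrounding hunks are taken from the patch, and the
# builder is assumed to be a SampleBatchBuilder-like helper:
#
#   batch = builder.build_and_reset(episode=None)  # finalize the synthetic rollout
#   episodes[0].add_extra_batch(batch)             # hand it to the sampler, which
#                                                  # merges it into ev.sample()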
@@ -329,7 +380,7 @@ def compute_actions(self, dones=t == 4, infos={}, new_obs=obs_batch[0]) - batch = builder.build_and_reset() + batch = builder.build_and_reset(episode=None) episodes[0].add_extra_batch(batch) # Just return zeros for actions diff --git a/python/ray/rllib/test/test_nested_spaces.py b/python/ray/rllib/test/test_nested_spaces.py new file mode 100644 index 0000000000000..95744b7e278af --- /dev/null +++ b/python/ray/rllib/test/test_nested_spaces.py @@ -0,0 +1,346 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import pickle + +from gym import spaces +from gym.envs.registration import EnvSpec +import gym +import tensorflow.contrib.slim as slim +import tensorflow as tf +import unittest + +import ray +from ray.rllib.agents.pg import PGAgent +from ray.rllib.agents.pg.pg_policy_graph import PGPolicyGraph +from ray.rllib.env import MultiAgentEnv +from ray.rllib.env.async_vector_env import AsyncVectorEnv +from ray.rllib.env.vector_env import VectorEnv +from ray.rllib.models import ModelCatalog +from ray.rllib.models.model import Model +from ray.rllib.test.test_external_env import SimpleServing +from ray.tune.registry import register_env + +DICT_SPACE = spaces.Dict({ + "sensors": spaces.Dict({ + "position": spaces.Box(low=-100, high=100, shape=(3, )), + "velocity": spaces.Box(low=-1, high=1, shape=(3, )), + "front_cam": spaces.Tuple( + (spaces.Box(low=0, high=1, shape=(10, 10, 3)), + spaces.Box(low=0, high=1, shape=(10, 10, 3)))), + "rear_cam": spaces.Box(low=0, high=1, shape=(10, 10, 3)), + }), + "inner_state": spaces.Dict({ + "charge": spaces.Discrete(100), + "job_status": spaces.Dict({ + "task": spaces.Discrete(5), + "progress": spaces.Box(low=0, high=100, shape=()), + }) + }) +}) + +DICT_SAMPLES = [DICT_SPACE.sample() for _ in range(10)] + +TUPLE_SPACE = spaces.Tuple([ + spaces.Box(low=-100, high=100, shape=(3, )), + spaces.Tuple((spaces.Box(low=0, high=1, shape=(10, 10, 3)), + spaces.Box(low=0, high=1, shape=(10, 10, 3)))), + spaces.Discrete(5), +]) + +TUPLE_SAMPLES = [TUPLE_SPACE.sample() for _ in range(10)] + + +def one_hot(i, n): + out = [0.0] * n + out[i] = 1.0 + return out + + +class NestedDictEnv(gym.Env): + def __init__(self): + self.action_space = spaces.Discrete(2) + self.observation_space = DICT_SPACE + self._spec = EnvSpec("NestedDictEnv-v0") + self.steps = 0 + + def reset(self): + self.steps = 0 + return DICT_SAMPLES[0] + + def step(self, action): + self.steps += 1 + return DICT_SAMPLES[self.steps], 1, self.steps >= 5, {} + + +class NestedTupleEnv(gym.Env): + def __init__(self): + self.action_space = spaces.Discrete(2) + self.observation_space = TUPLE_SPACE + self._spec = EnvSpec("NestedTupleEnv-v0") + self.steps = 0 + + def reset(self): + self.steps = 0 + return TUPLE_SAMPLES[0] + + def step(self, action): + self.steps += 1 + return TUPLE_SAMPLES[self.steps], 1, self.steps >= 5, {} + + +class NestedMultiAgentEnv(MultiAgentEnv): + def __init__(self): + self.steps = 0 + + def reset(self): + return { + "dict_agent": DICT_SAMPLES[0], + "tuple_agent": TUPLE_SAMPLES[0], + } + + def step(self, actions): + self.steps += 1 + obs = { + "dict_agent": DICT_SAMPLES[self.steps], + "tuple_agent": TUPLE_SAMPLES[self.steps], + } + rew = { + "dict_agent": 0, + "tuple_agent": 0, + } + dones = {"__all__": self.steps >= 5} + infos = { + "dict_agent": {}, + "tuple_agent": {}, + } + return obs, rew, dones, infos + + +class InvalidModel(Model): + def _build_layers_v2(self, input_dict, num_outputs, options): + return 
"not", "valid" + + +class InvalidModel2(Model): + def _build_layers_v2(self, input_dict, num_outputs, options): + return tf.constant(0), tf.constant(0) + + +class DictSpyModel(Model): + capture_index = 0 + + def _build_layers_v2(self, input_dict, num_outputs, options): + def spy(pos, front_cam, task): + # TF runs this function in an isolated context, so we have to use + # redis to communicate back to our suite + ray.experimental.internal_kv._internal_kv_put( + "d_spy_in_{}".format(DictSpyModel.capture_index), + pickle.dumps((pos, front_cam, task)), + overwrite=True) + DictSpyModel.capture_index += 1 + return 0 + + spy_fn = tf.py_func( + spy, [ + input_dict["obs"]["sensors"]["position"], + input_dict["obs"]["sensors"]["front_cam"][0], + input_dict["obs"]["inner_state"]["job_status"]["task"] + ], + tf.int64, + stateful=True) + + with tf.control_dependencies([spy_fn]): + output = slim.fully_connected( + input_dict["obs"]["sensors"]["position"], num_outputs) + return output, output + + +class TupleSpyModel(Model): + capture_index = 0 + + def _build_layers_v2(self, input_dict, num_outputs, options): + def spy(pos, cam, task): + # TF runs this function in an isolated context, so we have to use + # redis to communicate back to our suite + ray.experimental.internal_kv._internal_kv_put( + "t_spy_in_{}".format(TupleSpyModel.capture_index), + pickle.dumps((pos, cam, task)), + overwrite=True) + TupleSpyModel.capture_index += 1 + return 0 + + spy_fn = tf.py_func( + spy, [ + input_dict["obs"][0], + input_dict["obs"][1][0], + input_dict["obs"][2], + ], + tf.int64, + stateful=True) + + with tf.control_dependencies([spy_fn]): + output = slim.fully_connected(input_dict["obs"][0], num_outputs) + return output, output + + +class NestedSpacesTest(unittest.TestCase): + def testInvalidModel(self): + ModelCatalog.register_custom_model("invalid", InvalidModel) + self.assertRaises(ValueError, lambda: PGAgent( + env="CartPole-v0", config={ + "model": { + "custom_model": "invalid", + }, + })) + + def testInvalidModel2(self): + ModelCatalog.register_custom_model("invalid2", InvalidModel2) + self.assertRaisesRegexp( + ValueError, "Expected output.*", + lambda: PGAgent( + env="CartPole-v0", config={ + "model": { + "custom_model": "invalid2", + }, + })) + + def doTestNestedDict(self, make_env, test_lstm=False): + ModelCatalog.register_custom_model("composite", DictSpyModel) + register_env("nested", make_env) + pg = PGAgent( + env="nested", + config={ + "num_workers": 0, + "sample_batch_size": 5, + "model": { + "custom_model": "composite", + "use_lstm": test_lstm, + }, + }) + pg.train() + + # Check that the model sees the correct reconstructed observations + for i in range(4): + seen = pickle.loads( + ray.experimental.internal_kv._internal_kv_get( + "d_spy_in_{}".format(i))) + pos_i = DICT_SAMPLES[i]["sensors"]["position"].tolist() + cam_i = DICT_SAMPLES[i]["sensors"]["front_cam"][0].tolist() + task_i = one_hot( + DICT_SAMPLES[i]["inner_state"]["job_status"]["task"], 5) + self.assertEqual(seen[0][0].tolist(), pos_i) + self.assertEqual(seen[1][0].tolist(), cam_i) + self.assertEqual(seen[2][0].tolist(), task_i) + + def doTestNestedTuple(self, make_env): + ModelCatalog.register_custom_model("composite2", TupleSpyModel) + register_env("nested2", make_env) + pg = PGAgent( + env="nested2", + config={ + "num_workers": 0, + "sample_batch_size": 5, + "model": { + "custom_model": "composite2", + }, + }) + pg.train() + + # Check that the model sees the correct reconstructed observations + for i in range(4): + seen = pickle.loads( + 
ray.experimental.internal_kv._internal_kv_get( + "t_spy_in_{}".format(i))) + pos_i = TUPLE_SAMPLES[i][0].tolist() + cam_i = TUPLE_SAMPLES[i][1][0].tolist() + task_i = one_hot(TUPLE_SAMPLES[i][2], 5) + self.assertEqual(seen[0][0].tolist(), pos_i) + self.assertEqual(seen[1][0].tolist(), cam_i) + self.assertEqual(seen[2][0].tolist(), task_i) + + def testNestedDictGym(self): + self.doTestNestedDict(lambda _: NestedDictEnv()) + + def testNestedDictGymLSTM(self): + self.doTestNestedDict(lambda _: NestedDictEnv(), test_lstm=True) + + def testNestedDictVector(self): + self.doTestNestedDict( + lambda _: VectorEnv.wrap(lambda i: NestedDictEnv())) + + def testNestedDictServing(self): + self.doTestNestedDict(lambda _: SimpleServing(NestedDictEnv())) + + def testNestedDictAsync(self): + self.doTestNestedDict( + lambda _: AsyncVectorEnv.wrap_async(NestedDictEnv())) + + def testNestedTupleGym(self): + self.doTestNestedTuple(lambda _: NestedTupleEnv()) + + def testNestedTupleVector(self): + self.doTestNestedTuple( + lambda _: VectorEnv.wrap(lambda i: NestedTupleEnv())) + + def testNestedTupleServing(self): + self.doTestNestedTuple(lambda _: SimpleServing(NestedTupleEnv())) + + def testNestedTupleAsync(self): + self.doTestNestedTuple( + lambda _: AsyncVectorEnv.wrap_async(NestedTupleEnv())) + + def testMultiAgentComplexSpaces(self): + ModelCatalog.register_custom_model("dict_spy", DictSpyModel) + ModelCatalog.register_custom_model("tuple_spy", TupleSpyModel) + register_env("nested_ma", lambda _: NestedMultiAgentEnv()) + act_space = spaces.Discrete(2) + pg = PGAgent( + env="nested_ma", + config={ + "num_workers": 0, + "sample_batch_size": 5, + "multiagent": { + "policy_graphs": { + "tuple_policy": ( + PGPolicyGraph, TUPLE_SPACE, act_space, + {"model": {"custom_model": "tuple_spy"}}), + "dict_policy": ( + PGPolicyGraph, DICT_SPACE, act_space, + {"model": {"custom_model": "dict_spy"}}), + }, + "policy_mapping_fn": lambda a: { + "tuple_agent": "tuple_policy", + "dict_agent": "dict_policy"}[a], + }, + }) + pg.train() + + for i in range(4): + seen = pickle.loads( + ray.experimental.internal_kv._internal_kv_get( + "d_spy_in_{}".format(i))) + pos_i = DICT_SAMPLES[i]["sensors"]["position"].tolist() + cam_i = DICT_SAMPLES[i]["sensors"]["front_cam"][0].tolist() + task_i = one_hot( + DICT_SAMPLES[i]["inner_state"]["job_status"]["task"], 5) + self.assertEqual(seen[0][0].tolist(), pos_i) + self.assertEqual(seen[1][0].tolist(), cam_i) + self.assertEqual(seen[2][0].tolist(), task_i) + + for i in range(4): + seen = pickle.loads( + ray.experimental.internal_kv._internal_kv_get( + "t_spy_in_{}".format(i))) + pos_i = TUPLE_SAMPLES[i][0].tolist() + cam_i = TUPLE_SAMPLES[i][1][0].tolist() + task_i = one_hot(TUPLE_SAMPLES[i][2], 5) + self.assertEqual(seen[0][0].tolist(), pos_i) + self.assertEqual(seen[1][0].tolist(), cam_i) + self.assertEqual(seen[2][0].tolist(), task_i) + + +if __name__ == "__main__": + ray.init(num_cpus=5) + unittest.main(verbosity=2) diff --git a/python/ray/rllib/test/test_policy_evaluator.py b/python/ray/rllib/test/test_policy_evaluator.py index cc189edbf6e0c..cf319a7e922b2 100644 --- a/python/ray/rllib/test/test_policy_evaluator.py +++ b/python/ray/rllib/test/test_policy_evaluator.py @@ -3,8 +3,10 @@ from __future__ import print_function import gym +import numpy as np import time import unittest +from collections import Counter import ray from ray.rllib.agents.pg import PGAgent @@ -21,11 +23,16 @@ class MockPolicyGraph(PolicyGraph): def compute_actions(self, obs_batch, state_batches, - is_training=False, + 
prev_action_batch=None, + prev_reward_batch=None, episodes=None): return [0] * len(obs_batch), [], {} - def postprocess_trajectory(self, batch, other_agent_batches=None): + def postprocess_trajectory(self, + batch, + other_agent_batches=None, + episode=None): + assert episode is not None return compute_advantages(batch, 100.0, 0.9, use_gae=False) @@ -33,14 +40,31 @@ class BadPolicyGraph(PolicyGraph): def compute_actions(self, obs_batch, state_batches, - is_training=False, + prev_action_batch=None, + prev_reward_batch=None, episodes=None): raise Exception("intentional error") - def postprocess_trajectory(self, batch, other_agent_batches=None): + def postprocess_trajectory(self, + batch, + other_agent_batches=None, + episode=None): + assert episode is not None return compute_advantages(batch, 100.0, 0.9, use_gae=False) +class FailOnStepEnv(gym.Env): + def __init__(self): + self.observation_space = gym.spaces.Discrete(1) + self.action_space = gym.spaces.Discrete(2) + + def reset(self): + raise ValueError("kaboom") + + def step(self, action): + raise ValueError("kaboom") + + class MockEnv(gym.Env): def __init__(self, episode_length, config=None): self.episode_length = episode_length @@ -107,10 +131,39 @@ def testBasic(self): env_creator=lambda _: gym.make("CartPole-v0"), policy_graph=MockPolicyGraph) batch = ev.sample() - for key in ["obs", "actions", "rewards", "dones", "advantages"]: + for key in [ + "obs", "actions", "rewards", "dones", "advantages", + "prev_rewards", "prev_actions" + ]: self.assertIn(key, batch) + + def to_prev(vec): + out = np.zeros_like(vec) + for i, v in enumerate(vec): + if i + 1 < len(out) and not batch["dones"][i]: + out[i + 1] = v + return out.tolist() + + self.assertEqual(batch["prev_rewards"].tolist(), + to_prev(batch["rewards"])) + self.assertEqual(batch["prev_actions"].tolist(), + to_prev(batch["actions"])) self.assertGreater(batch["advantages"][0], 1) + # 11/23/18: Samples per second 8501.125113727468 + def testBaselinePerformance(self): + ev = PolicyEvaluator( + env_creator=lambda _: gym.make("CartPole-v0"), + policy_graph=MockPolicyGraph, + batch_steps=100) + start = time.time() + count = 0 + while time.time() - start < 1: + count += ev.sample().count + print() + print("Samples per second {}".format(count / (time.time() - start))) + print() + def testGlobalVarsUpdate(self): agent = A2CAgent( env="CartPole-v0", @@ -122,6 +175,34 @@ def testGlobalVarsUpdate(self): result2 = agent.train() self.assertLess(result2["info"]["learner"]["cur_lr"], 0.0001) + def testNoStepOnInit(self): + register_env("fail", lambda _: FailOnStepEnv()) + pg = PGAgent(env="fail", config={"num_workers": 1}) + self.assertRaises(Exception, lambda: pg.train()) + + def testCallbacks(self): + counts = Counter() + pg = PGAgent( + env="CartPole-v0", config={ + "num_workers": 0, + "sample_batch_size": 50, + "callbacks": { + "on_episode_start": lambda x: counts.update({"start": 1}), + "on_episode_step": lambda x: counts.update({"step": 1}), + "on_episode_end": lambda x: counts.update({"end": 1}), + "on_sample_end": lambda x: counts.update({"sample": 1}), + }, + }) + pg.train() + pg.train() + pg.train() + pg.train() + self.assertEqual(counts["sample"], 4) + self.assertGreater(counts["start"], 0) + self.assertGreater(counts["end"], 0) + self.assertGreater(counts["step"], 200) + self.assertLess(counts["step"], 400) + def testQueryEvaluators(self): register_env("test", lambda _: gym.make("CartPole-v0")) pg = PGAgent( @@ -129,9 +210,10 @@ def testQueryEvaluators(self): "num_workers": 2, 
"sample_batch_size": 5 }) - results = pg.optimizer.foreach_evaluator(lambda ev: ev.batch_steps) + results = pg.optimizer.foreach_evaluator( + lambda ev: ev.sample_batch_size) results2 = pg.optimizer.foreach_evaluator_with_index( - lambda ev, i: (i, ev.batch_steps)) + lambda ev, i: (i, ev.sample_batch_size)) self.assertEqual(results, [5, 5, 5]) self.assertEqual(results2, [(0, 5), (1, 5), (2, 5)]) @@ -198,7 +280,7 @@ def testAutoVectorization(self): env_creator=lambda cfg: MockEnv(episode_length=20, config=cfg), policy_graph=MockPolicyGraph, batch_mode="truncate_episodes", - batch_steps=16, + batch_steps=2, num_envs=8) for _ in range(8): batch = ev.sample() @@ -216,21 +298,12 @@ def testAutoVectorization(self): indices.append(env.unwrapped.config.vector_index) self.assertEqual(indices, [0, 1, 2, 3, 4, 5, 6, 7]) - def testBatchDivisibilityCheck(self): - self.assertRaises( - ValueError, - lambda: PolicyEvaluator( - env_creator=lambda _: MockEnv(episode_length=8), - policy_graph=MockPolicyGraph, - batch_mode="truncate_episodes", - batch_steps=15, num_envs=4)) - - def testBatchesSmallerWhenVectorized(self): + def testBatchesLargerWhenVectorized(self): ev = PolicyEvaluator( env_creator=lambda _: MockEnv(episode_length=8), policy_graph=MockPolicyGraph, batch_mode="truncate_episodes", - batch_steps=16, + batch_steps=4, num_envs=4) batch = ev.sample() self.assertEqual(batch.count, 16) diff --git a/python/ray/rllib/test/test_rollout.sh b/python/ray/rllib/test/test_rollout.sh new file mode 100755 index 0000000000000..04685b2be345d --- /dev/null +++ b/python/ray/rllib/test/test_rollout.sh @@ -0,0 +1,28 @@ +#!/bin/bash -e + +TRAIN=/ray/python/ray/rllib/train.py +if [ ! -e "$TRAIN" ]; then + TRAIN=../train.py +fi +ROLLOUT=/ray/python/ray/rllib/rollout.py +if [ ! -e "$ROLLOUT" ]; then + ROLLOUT=../rollout.py +fi + +TMP=`mktemp -d` +echo "Saving results to $TMP" + +$TRAIN --local-dir=$TMP --run=IMPALA --checkpoint-freq=1 \ + --config='{"num_workers": 1, "num_gpus": 0}' --env=Pong-ram-v4 \ + --stop='{"training_iteration": 1}' +find $TMP + +CHECKPOINT_PATH=`ls $TMP/default/*/checkpoint_1/checkpoint-1` +echo "Checkpoint path $CHECKPOINT_PATH" +test -e "$CHECKPOINT_PATH" + +$ROLLOUT --run=IMPALA "$CHECKPOINT_PATH" --steps=100 \ + --out="$TMP/rollouts.pkl" --no-render +test -e "$TMP/rollouts.pkl" +rm -rf "$TMP" +echo "OK" diff --git a/python/ray/rllib/test/test_supported_spaces.py b/python/ray/rllib/test/test_supported_spaces.py index 2ced3402a78a6..2e5b74b536f90 100644 --- a/python/ray/rllib/test/test_supported_spaces.py +++ b/python/ray/rllib/test/test_supported_spaces.py @@ -2,49 +2,41 @@ import traceback import gym -from gym.spaces import Box, Discrete, Tuple +from gym.spaces import Box, Discrete, Tuple, Dict from gym.envs.registration import EnvSpec import numpy as np import sys import ray from ray.rllib.agents.agent import get_agent_class +from ray.rllib.test.test_multi_agent_env import MultiCartpole, MultiMountainCar from ray.rllib.utils.error import UnsupportedSpaceException from ray.tune.registry import register_env ACTION_SPACES_TO_TEST = { "discrete": Discrete(5), - "vector": Box(0.0, 1.0, (5, ), dtype=np.float32), - "simple_tuple": Tuple([ - Box(0.0, 1.0, (5, ), dtype=np.float32), - Box(0.0, 1.0, (5, ), dtype=np.float32) - ]), - "implicit_tuple": [ - Box(0.0, 1.0, (5, ), dtype=np.float32), - Box(0.0, 1.0, (5, ), dtype=np.float32) - ], - "mixed_tuple": Tuple( + "vector": Box(-1.0, 1.0, (5, ), dtype=np.float32), + "tuple": Tuple( [Discrete(2), Discrete(3), - Box(0.0, 1.0, (5, ), dtype=np.float32)]), + 
Box(-1.0, 1.0, (5, ), dtype=np.float32)]), } OBSERVATION_SPACES_TO_TEST = { "discrete": Discrete(5), - "vector": Box(0.0, 1.0, (5, ), dtype=np.float32), - "image": Box(0.0, 1.0, (84, 84, 1), dtype=np.float32), - "atari": Box(0.0, 1.0, (210, 160, 3), dtype=np.float32), - "atari_ram": Box(0.0, 1.0, (128, ), dtype=np.float32), - "simple_tuple": Tuple([ - Box(0.0, 1.0, (5, ), dtype=np.float32), - Box(0.0, 1.0, (5, ), dtype=np.float32) - ]), - "mixed_tuple": Tuple( - [Discrete(10), Box(0.0, 1.0, (5, ), dtype=np.float32)]), + "vector": Box(-1.0, 1.0, (5, ), dtype=np.float32), + "image": Box(-1.0, 1.0, (84, 84, 1), dtype=np.float32), + "atari": Box(-1.0, 1.0, (210, 160, 3), dtype=np.float32), + "tuple": Tuple([Discrete(10), + Box(-1.0, 1.0, (5, ), dtype=np.float32)]), + "dict": Dict({ + "task": Discrete(10), + "position": Box(-1.0, 1.0, (5, ), dtype=np.float32), + }), } -def make_stub_env(action_space, obs_space): +def make_stub_env(action_space, obs_space, check_action_bounds): class StubEnv(gym.Env): def __init__(self): self.action_space = action_space @@ -56,23 +48,30 @@ def reset(self): return sample def step(self, action): + if check_action_bounds and not self.action_space.contains(action): + raise ValueError("Illegal action for {}: {}".format( + self.action_space, action)) + if (isinstance(self.action_space, Tuple) + and len(action) != len(self.action_space.spaces)): + raise ValueError("Illegal action for {}: {}".format( + self.action_space, action)) return self.observation_space.sample(), 1, True, {} return StubEnv -def check_support(alg, config, stats): +def check_support(alg, config, stats, check_bounds=False): for a_name, action_space in ACTION_SPACES_TO_TEST.items(): for o_name, obs_space in OBSERVATION_SPACES_TO_TEST.items(): print("=== Testing", alg, action_space, obs_space, "===") - stub_env = make_stub_env(action_space, obs_space) + stub_env = make_stub_env(action_space, obs_space, check_bounds) register_env("stub_env", lambda c: stub_env()) stat = "ok" a = None try: a = get_agent_class(alg)(config=config, env="stub_env") a.train() - except UnsupportedSpaceException as e: + except UnsupportedSpaceException: stat = "unsupported" except Exception as e: stat = "ERROR" @@ -90,27 +89,56 @@ def check_support(alg, config, stats): stats[alg, a_name, o_name] = stat +def check_support_multiagent(alg, config): + register_env("multi_mountaincar", lambda _: MultiMountainCar(2)) + register_env("multi_cartpole", lambda _: MultiCartpole(2)) + if alg == "DDPG": + a = get_agent_class(alg)(config=config, env="multi_mountaincar") + else: + a = get_agent_class(alg)(config=config, env="multi_cartpole") + try: + a.train() + finally: + a.stop() + + class ModelSupportedSpaces(unittest.TestCase): + def setUp(self): + ray.init(num_cpus=4) + + def tearDown(self): + ray.shutdown() + def testAll(self): - ray.init() stats = {} - check_support("IMPALA", {"gpu": False}, stats) - check_support("DDPG", {"timesteps_per_iteration": 1}, stats) + check_support("IMPALA", {"num_gpus": 0}, stats) + check_support( + "DDPG", { + "noise_scale": 100.0, + "timesteps_per_iteration": 1 + }, + stats, + check_bounds=True) check_support("DQN", {"timesteps_per_iteration": 1}, stats) - check_support("A3C", { - "num_workers": 1, - "optimizer": { - "grads_per_step": 1 - } - }, stats) + check_support( + "A3C", { + "num_workers": 1, + "optimizer": { + "grads_per_step": 1 + } + }, + stats, + check_bounds=True) check_support( "PPO", { "num_workers": 1, "num_sgd_iter": 1, "train_batch_size": 10, "sample_batch_size": 10, - 
"sgd_minibatch_size": 1 - }, stats) + "sgd_minibatch_size": 1, + }, + stats, + check_bounds=True) check_support( "ES", { "num_workers": 1, @@ -125,7 +153,13 @@ def testAll(self): "num_rollouts": 1, "rollouts_used": 1 }, stats) - check_support("PG", {"num_workers": 1, "optimizer": {}}, stats) + check_support( + "PG", { + "num_workers": 1, + "optimizer": {} + }, + stats, + check_bounds=True) num_unexpected_errors = 0 for (alg, a_name, o_name), stat in sorted(stats.items()): if stat not in ["ok", "unsupported"]: @@ -134,6 +168,26 @@ def testAll(self): stat) self.assertEqual(num_unexpected_errors, 0) + def testMultiAgent(self): + check_support_multiagent("IMPALA", {"num_gpus": 0}) + check_support_multiagent("DQN", {"timesteps_per_iteration": 1}) + check_support_multiagent("A3C", { + "num_workers": 1, + "optimizer": { + "grads_per_step": 1 + } + }) + check_support_multiagent( + "PPO", { + "num_workers": 1, + "num_sgd_iter": 1, + "train_batch_size": 10, + "sample_batch_size": 10, + "sgd_minibatch_size": 1, + }) + check_support_multiagent("PG", {"num_workers": 1, "optimizer": {}}) + check_support_multiagent("DDPG", {"timesteps_per_iteration": 1}) + if __name__ == "__main__": if len(sys.argv) > 1 and sys.argv[1] == "--smoke": diff --git a/python/ray/rllib/train.py b/python/ray/rllib/train.py index b9e7b72efd673..72d6fc0b58c3d 100755 --- a/python/ray/rllib/train.py +++ b/python/ray/rllib/train.py @@ -8,6 +8,7 @@ import yaml import ray +from ray.test.cluster_utils import Cluster from ray.tune.config_parser import make_parser, resources_to_json from ray.tune.tune import _make_scheduler, run_experiments @@ -37,19 +38,33 @@ def create_parser(parser_creator=None): "--redis-address", default=None, type=str, - help="The Redis address of the cluster.") + help="Connect to an existing Ray cluster at this address instead " + "of starting a new one.") parser.add_argument( "--ray-num-cpus", default=None, type=int, - help="--num-cpus to pass to Ray." - " This only has an affect in local mode.") + help="--num-cpus to use if starting a new cluster.") parser.add_argument( "--ray-num-gpus", default=None, type=int, - help="--num-gpus to pass to Ray." 
- " This only has an affect in local mode.") + help="--num-gpus to use if starting a new cluster.") + parser.add_argument( + "--ray-num-local-schedulers", + default=None, + type=int, + help="Emulate multiple cluster nodes for debugging.") + parser.add_argument( + "--ray-redis-max-memory", + default=None, + type=int, + help="--redis-max-memory to use if starting a new cluster.") + parser.add_argument( + "--ray-object-store-memory", + default=None, + type=int, + help="--object-store-memory to use if starting a new cluster.") parser.add_argument( "--experiment-name", default="default", @@ -102,10 +117,24 @@ def run(args, parser): if not exp.get("env") and not exp.get("config", {}).get("env"): parser.error("the following arguments are required: --env") - ray.init( - redis_address=args.redis_address, - num_cpus=args.ray_num_cpus, - num_gpus=args.ray_num_gpus) + if args.ray_num_local_schedulers: + cluster = Cluster() + for _ in range(args.ray_num_local_schedulers): + cluster.add_node( + resources={ + "num_cpus": args.ray_num_cpus or 1, + "num_gpus": args.ray_num_gpus or 0, + }, + object_store_memory=args.ray_object_store_memory, + redis_max_memory=args.ray_redis_max_memory) + ray.init(redis_address=cluster.redis_address) + else: + ray.init( + redis_address=args.redis_address, + object_store_memory=args.ray_object_store_memory, + redis_max_memory=args.ray_redis_max_memory, + num_cpus=args.ray_num_cpus, + num_gpus=args.ray_num_gpus) run_experiments( experiments, scheduler=_make_scheduler(args), diff --git a/python/ray/rllib/tuned_examples/atari-a2c.yaml b/python/ray/rllib/tuned_examples/atari-a2c.yaml index 89feaee5ba8b6..42ea119638e62 100644 --- a/python/ray/rllib/tuned_examples/atari-a2c.yaml +++ b/python/ray/rllib/tuned_examples/atari-a2c.yaml @@ -9,11 +9,11 @@ atari-a2c: - SpaceInvadersNoFrameskip-v4 run: A2C config: - sample_batch_size: 100 + sample_batch_size: 20 clip_rewards: True num_workers: 5 num_envs_per_worker: 5 - gpu: true + num_gpus: 1 lr_schedule: [ [0, 0.0007], [20000000, 0.000000000001], diff --git a/python/ray/rllib/tuned_examples/atari-apex.yaml b/python/ray/rllib/tuned_examples/atari-apex.yaml index 6e538d038998a..e24e347dd18aa 100644 --- a/python/ray/rllib/tuned_examples/atari-apex.yaml +++ b/python/ray/rllib/tuned_examples/atari-apex.yaml @@ -23,12 +23,12 @@ apex: prioritized_replay_alpha: 0.5 beta_annealing_fraction: 1.0 final_prioritized_replay_beta: 1.0 - gpu: false + num_gpus: 1 # APEX num_workers: 8 num_envs_per_worker: 8 - sample_batch_size: 158 + sample_batch_size: 20 train_batch_size: 512 target_network_update_freq: 50000 timesteps_per_iteration: 25000 diff --git a/python/ray/rllib/tuned_examples/atari-dist-dqn.yaml b/python/ray/rllib/tuned_examples/atari-dist-dqn.yaml index d719329861e88..d351e403f2e23 100644 --- a/python/ray/rllib/tuned_examples/atari-dist-dqn.yaml +++ b/python/ray/rllib/tuned_examples/atari-dist-dqn.yaml @@ -27,5 +27,5 @@ basic-dqn: prioritized_replay_alpha: 0.5 beta_annealing_fraction: 1.0 final_prioritized_replay_beta: 1.0 - gpu: true + num_gpus: 0.2 timesteps_per_iteration: 10000 diff --git a/python/ray/rllib/tuned_examples/atari-dqn.yaml b/python/ray/rllib/tuned_examples/atari-dqn.yaml index 4929017879c97..b8731bb054ef3 100644 --- a/python/ray/rllib/tuned_examples/atari-dqn.yaml +++ b/python/ray/rllib/tuned_examples/atari-dqn.yaml @@ -1,4 +1,4 @@ -# Runs on a single g3.16xl node +# Runs on a single g3.4xl node # See https://github.com/ray-project/rl-experiments for results atari-basic-dqn: env: @@ -29,5 +29,5 @@ atari-basic-dqn: 
prioritized_replay_alpha: 0.5 beta_annealing_fraction: 1.0 final_prioritized_replay_beta: 1.0 - gpu: true + num_gpus: 0.2 timesteps_per_iteration: 10000 diff --git a/python/ray/rllib/tuned_examples/atari-duel-ddqn.yaml b/python/ray/rllib/tuned_examples/atari-duel-ddqn.yaml index 61ed3120de1ac..b5a13162b61e4 100644 --- a/python/ray/rllib/tuned_examples/atari-duel-ddqn.yaml +++ b/python/ray/rllib/tuned_examples/atari-duel-ddqn.yaml @@ -1,3 +1,5 @@ +# Runs on a single g3.4xl node +# See https://github.com/ray-project/rl-experiments for results dueling-ddqn: env: grid_search: @@ -27,5 +29,5 @@ dueling-ddqn: prioritized_replay_alpha: 0.5 beta_annealing_fraction: 1.0 final_prioritized_replay_beta: 1.0 - gpu: true + num_gpus: 0.2 timesteps_per_iteration: 10000 diff --git a/python/ray/rllib/tuned_examples/atari-impala.yaml b/python/ray/rllib/tuned_examples/atari-impala.yaml index 85bd801ff83b5..597b41987b3f6 100644 --- a/python/ray/rllib/tuned_examples/atari-impala.yaml +++ b/python/ray/rllib/tuned_examples/atari-impala.yaml @@ -9,7 +9,7 @@ atari-impala: - SpaceInvadersNoFrameskip-v4 run: IMPALA config: - sample_batch_size: 250 # 50 * num_envs_per_worker + sample_batch_size: 50 train_batch_size: 500 num_workers: 32 num_envs_per_worker: 5 diff --git a/python/ray/rllib/tuned_examples/atari-ppo.yaml b/python/ray/rllib/tuned_examples/atari-ppo.yaml index 24593d6bb9299..c6be6435041ca 100644 --- a/python/ray/rllib/tuned_examples/atari-ppo.yaml +++ b/python/ray/rllib/tuned_examples/atari-ppo.yaml @@ -16,7 +16,7 @@ atari-ppo: vf_clip_param: 10.0 entropy_coeff: 0.01 train_batch_size: 5000 - sample_batch_size: 500 + sample_batch_size: 100 sgd_minibatch_size: 500 num_sgd_iter: 10 num_workers: 10 diff --git a/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml b/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml index 34c60e5219b4e..f02399ab33ff2 100644 --- a/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml +++ b/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml @@ -34,8 +34,9 @@ halfcheetah-ddpg: clip_rewards: False # === Optimization === - actor_lr: 0.0001 - critic_lr: 0.001 + lr: 0.001 + actor_loss_coeff: 0.1 + critic_loss_coeff: 1.0 use_huber: False huber_threshold: 1.0 l2_reg: 0.000001 diff --git a/python/ray/rllib/tuned_examples/hopper-ppo.yaml b/python/ray/rllib/tuned_examples/hopper-ppo.yaml index c1c75b166e7cd..5082dc7921e47 100644 --- a/python/ray/rllib/tuned_examples/hopper-ppo.yaml +++ b/python/ray/rllib/tuned_examples/hopper-ppo.yaml @@ -10,3 +10,4 @@ hopper-ppo: train_batch_size: 160000 num_workers: 64 num_gpus: 4 + batch_mode: complete_episodes diff --git a/python/ray/rllib/tuned_examples/humanoid-ppo-gae.yaml b/python/ray/rllib/tuned_examples/humanoid-ppo-gae.yaml index e176dcae26c67..9473b5df7a6a3 100644 --- a/python/ray/rllib/tuned_examples/humanoid-ppo-gae.yaml +++ b/python/ray/rllib/tuned_examples/humanoid-ppo-gae.yaml @@ -17,3 +17,4 @@ humanoid-ppo-gae: free_log_std: true num_workers: 64 num_gpus: 4 + batch_mode: complete_episodes diff --git a/python/ray/rllib/tuned_examples/humanoid-ppo.yaml b/python/ray/rllib/tuned_examples/humanoid-ppo.yaml index 0608f8b60353c..07371d16f712b 100644 --- a/python/ray/rllib/tuned_examples/humanoid-ppo.yaml +++ b/python/ray/rllib/tuned_examples/humanoid-ppo.yaml @@ -15,3 +15,4 @@ humanoid-ppo: use_gae: false num_workers: 64 num_gpus: 4 + batch_mode: complete_episodes diff --git a/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml b/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml index a71b1e98ff658..e74b2e0f138e8 
100644 --- a/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml +++ b/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml @@ -34,8 +34,9 @@ mountaincarcontinuous-ddpg: clip_rewards: False # === Optimization === - actor_lr: 0.0001 - critic_lr: 0.001 + lr: 0.001 + actor_loss_coeff: 0.1 + critic_loss_coeff: 1.0 use_huber: False huber_threshold: 1.0 l2_reg: 0.00001 diff --git a/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml b/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml index 3cf68bcdc23e4..e28eee3e8e216 100644 --- a/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml +++ b/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml @@ -34,8 +34,9 @@ pendulum-ddpg: clip_rewards: False # === Optimization === - actor_lr: 0.0001 - critic_lr: 0.001 + lr: 0.001 + actor_loss_coeff: 0.1 + critic_loss_coeff: 1.0 use_huber: True huber_threshold: 1.0 l2_reg: 0.000001 diff --git a/python/ray/rllib/tuned_examples/pendulum-ppo.yaml b/python/ray/rllib/tuned_examples/pendulum-ppo.yaml index 60df6825bd435..b8c0293a3e338 100644 --- a/python/ray/rllib/tuned_examples/pendulum-ppo.yaml +++ b/python/ray/rllib/tuned_examples/pendulum-ppo.yaml @@ -13,4 +13,4 @@ pendulum-ppo: num_sgd_iter: 10 model: fcnet_hiddens: [64, 64] - squash_to_range: True + batch_mode: complete_episodes diff --git a/python/ray/rllib/tuned_examples/pendulum-td3.yaml b/python/ray/rllib/tuned_examples/pendulum-td3.yaml new file mode 100644 index 0000000000000..25b0900d63c2a --- /dev/null +++ b/python/ray/rllib/tuned_examples/pendulum-td3.yaml @@ -0,0 +1,60 @@ +# This configuration can expect to reach -160 reward in 10k-20k timesteps +pendulum-ddpg: + env: Pendulum-v0 + run: DDPG + stop: + episode_reward_mean: -160 + time_total_s: 600 # 10 minutes + config: + # === Tricks === + twin_q: True + policy_delay: 2 + smooth_target_policy: True + act_noise: 0.1 + target_noise: 0.2 + noise_clip: 0.5 + + # === Model === + actor_hiddens: [64, 64] + critic_hiddens: [64, 64] + n_step: 1 + model: {} + gamma: 0.99 + env_config: {} + + # === Exploration === + schedule_max_timesteps: 100000 + timesteps_per_iteration: 600 + exploration_fraction: 0.1 + exploration_final_eps: 0.02 + noise_scale: 0.1 + exploration_theta: 0.15 + exploration_sigma: 0.2 + target_network_update_freq: 0 + tau: 0.001 + + # === Replay buffer === + buffer_size: 10000 + prioritized_replay: True + prioritized_replay_alpha: 0.6 + prioritized_replay_beta: 0.4 + prioritized_replay_eps: 0.000001 + clip_rewards: False + + # === Optimization === + lr: 0.001 + actor_loss_coeff: 0.1 + critic_loss_coeff: 1.0 + use_huber: True + huber_threshold: 1.0 + l2_reg: 0.000001 + learning_starts: 500 + sample_batch_size: 1 + train_batch_size: 64 + + # === Parallelism === + num_workers: 0 + num_gpus_per_worker: 0 + optimizer_class: "SyncReplayOptimizer" + per_worker_exploration: False + worker_side_prioritization: False diff --git a/python/ray/rllib/tuned_examples/pong-a3c-pytorch.yaml b/python/ray/rllib/tuned_examples/pong-a3c-pytorch.yaml index 891c4b9919277..c3f608ddccb66 100644 --- a/python/ray/rllib/tuned_examples/pong-a3c-pytorch.yaml +++ b/python/ray/rllib/tuned_examples/pong-a3c-pytorch.yaml @@ -15,7 +15,7 @@ pong-a3c-pytorch-cnn: model: use_lstm: false channel_major: true - dim: 80 + dim: 84 grayscale: true zero_mean: false optimizer: diff --git a/python/ray/rllib/tuned_examples/pong-dqn.yaml b/python/ray/rllib/tuned_examples/pong-dqn.yaml index a0d39cc3dadc2..2c3e5a877ed4c 100644 --- a/python/ray/rllib/tuned_examples/pong-dqn.yaml +++ 
b/python/ray/rllib/tuned_examples/pong-dqn.yaml @@ -6,7 +6,7 @@ pong-deterministic-dqn: episode_reward_mean: 20 time_total_s: 7200 config: - gpu: True + num_gpus: 1 gamma: 0.99 lr: .0001 learning_starts: 10000 diff --git a/python/ray/rllib/tuned_examples/pong-impala-fast.yaml b/python/ray/rllib/tuned_examples/pong-impala-fast.yaml new file mode 100644 index 0000000000000..3c29f4e0c08e4 --- /dev/null +++ b/python/ray/rllib/tuned_examples/pong-impala-fast.yaml @@ -0,0 +1,19 @@ +# This can reach 18-19 reward in ~3 minutes on p3.16xl head w/m4.16xl workers +# 128 workers -> 3 minutes (best case) +# 64 workers -> 4 minutes +# 32 workers -> 7 minutes +# See also: pong-impala.yaml, pong-impala-vectorized.yaml +pong-impala-fast: + env: PongNoFrameskip-v4 + run: IMPALA + config: + sample_batch_size: 50 + train_batch_size: 1000 + num_workers: 128 + num_envs_per_worker: 5 + broadcast_interval: 5 + max_sample_requests_in_flight_per_worker: 1 + num_parallel_data_loaders: 4 + num_gpus: 2 + model: + dim: 42 diff --git a/python/ray/rllib/tuned_examples/pong-impala-vectorized.yaml b/python/ray/rllib/tuned_examples/pong-impala-vectorized.yaml index 9525f4115521e..b16488b443b80 100644 --- a/python/ray/rllib/tuned_examples/pong-impala-vectorized.yaml +++ b/python/ray/rllib/tuned_examples/pong-impala-vectorized.yaml @@ -5,7 +5,7 @@ pong-impala-vectorized: env: PongNoFrameskip-v4 run: IMPALA config: - sample_batch_size: 500 # 50 * num_envs_per_worker + sample_batch_size: 50 train_batch_size: 500 num_workers: 32 num_envs_per_worker: 10 diff --git a/python/ray/rllib/tuned_examples/pong-impala.yaml b/python/ray/rllib/tuned_examples/pong-impala.yaml index b54c79849c5ab..527bc905d8e57 100644 --- a/python/ray/rllib/tuned_examples/pong-impala.yaml +++ b/python/ray/rllib/tuned_examples/pong-impala.yaml @@ -2,7 +2,7 @@ # 128 workers -> 8 minutes # 32 workers -> 17 minutes # 16 workers -> 40 min+ -# See also: pong-impala-vectorized.yaml +# See also: pong-impala-fast.yaml, pong-impala-vectorized.yaml pong-impala: env: PongNoFrameskip-v4 run: IMPALA diff --git a/python/ray/rllib/tuned_examples/pong-ppo.yaml b/python/ray/rllib/tuned_examples/pong-ppo.yaml index 1447481643fe5..d7e273cc6e2bd 100644 --- a/python/ray/rllib/tuned_examples/pong-ppo.yaml +++ b/python/ray/rllib/tuned_examples/pong-ppo.yaml @@ -1,17 +1,26 @@ -# On a Tesla K80 GPU, this achieves the maximum reward in about 1-1.5 hours. +# On a single GPU, this achieves maximum reward in ~15-20 minutes. 
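The tuned-example changes above and below (fractional `num_gpus`, smaller `sample_batch_size`, `batch_mode: complete_episodes`, and the new TD3 and fast-IMPALA configs) are all consumed through Tune. As a rough sketch of how one of these files can be run programmatically, assuming the era's `tune.run_experiments` API and using an example file path from this diff:

    import yaml

    import ray
    from ray import tune

    # Load one of the tuned-example files touched in this diff and hand the
    # resulting dict of experiments to Tune, roughly what
    # `python train.py -f <file>` does. The path is an example; resource
    # settings such as a 0.2-GPU share per trial come from the YAML itself.
    with open("python/ray/rllib/tuned_examples/pong-impala-fast.yaml") as f:
        experiments = yaml.safe_load(f)

    ray.init()
    tune.run_experiments(experiments)
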
# -# $ python train.py -f tuned_examples/pong-ppo.yaml --ray-num-gpus=1 +# $ python train.py -f tuned_examples/pong-ppo.yaml # -# - PPO_PongDeterministic-v4_0: TERMINATED [pid=16387], 4984 s, 1117981 ts, 21 rew -# - PPO_PongDeterministic-v4_0: TERMINATED [pid=83606], 4592 s, 1068671 ts, 21 rew -# -pong-deterministic-ppo: - env: PongDeterministic-v4 +pong-ppo: + env: PongNoFrameskip-v4 run: PPO - stop: - episode_reward_mean: 21 config: - gamma: 0.99 - num_workers: 4 - num_sgd_iter: 20 + lambda: 0.95 + kl_coeff: 0.5 + clip_rewards: True + clip_param: 0.1 + vf_clip_param: 10.0 + entropy_coeff: 0.01 + train_batch_size: 5000 + sample_batch_size: 20 + sgd_minibatch_size: 500 + num_sgd_iter: 10 + num_workers: 32 + num_envs_per_worker: 5 + batch_mode: truncate_episodes + observation_filter: NoFilter + vf_share_layers: true num_gpus: 1 + model: + dim: 42 diff --git a/python/ray/rllib/tuned_examples/regression_tests/cartpole-ppo.yaml b/python/ray/rllib/tuned_examples/regression_tests/cartpole-ppo.yaml index 425958e5c109f..82ea5846e733c 100644 --- a/python/ray/rllib/tuned_examples/regression_tests/cartpole-ppo.yaml +++ b/python/ray/rllib/tuned_examples/regression_tests/cartpole-ppo.yaml @@ -6,3 +6,4 @@ cartpole-ppo: time_total_s: 300 config: num_workers: 1 + batch_mode: complete_episodes diff --git a/python/ray/rllib/tuned_examples/regression_tests/pendulum-ppo.yaml b/python/ray/rllib/tuned_examples/regression_tests/pendulum-ppo.yaml index 8b9d69fce20a6..63536d3be3704 100644 --- a/python/ray/rllib/tuned_examples/regression_tests/pendulum-ppo.yaml +++ b/python/ray/rllib/tuned_examples/regression_tests/pendulum-ppo.yaml @@ -15,3 +15,4 @@ pendulum-ppo: num_sgd_iter: 10 model: fcnet_hiddens: [64, 64] + batch_mode: complete_episodes diff --git a/python/ray/rllib/tuned_examples/swimmer-ars.yaml b/python/ray/rllib/tuned_examples/swimmer-ars.yaml index 338c8a12c2cfc..effb4cfe19a8a 100644 --- a/python/ray/rllib/tuned_examples/swimmer-ars.yaml +++ b/python/ray/rllib/tuned_examples/swimmer-ars.yaml @@ -9,8 +9,9 @@ swimmer-ars: num_workers: 1 sgd_stepsize: 0.02 noise_size: 250000000 - policy_type: LinearPolicy eval_prob: 0.2 offset: 0 observation_filter: NoFilter report_length: 3 + model: + fcnet_hiddens: [] # a linear policy diff --git a/python/ray/rllib/tuned_examples/walker2d-ppo.yaml b/python/ray/rllib/tuned_examples/walker2d-ppo.yaml index deb5a0038dcb7..9d64720a2c5b6 100644 --- a/python/ray/rllib/tuned_examples/walker2d-ppo.yaml +++ b/python/ray/rllib/tuned_examples/walker2d-ppo.yaml @@ -9,3 +9,4 @@ walker2d-v1-ppo: train_batch_size: 320000 num_workers: 64 num_gpus: 4 + batch_mode: complete_episodes diff --git a/python/ray/rllib/utils/actors.py b/python/ray/rllib/utils/actors.py index e865feb431b4b..7018073313112 100644 --- a/python/ray/rllib/utils/actors.py +++ b/python/ray/rllib/utils/actors.py @@ -2,9 +2,12 @@ from __future__ import division from __future__ import print_function +import logging import os import ray +logger = logging.getLogger(__name__) + class TaskPool(object): """Helper class for tracking the status of many in-flight actor tasks.""" @@ -36,11 +39,8 @@ def completed_prefetch(self): for worker, obj_id in self.completed(): plasma_id = ray.pyarrow.plasma.ObjectID(obj_id.id()) - if not ray.global_state.use_raylet: - ray.worker.global_worker.plasma_client.fetch([plasma_id]) - else: - (ray.worker.global_worker.local_scheduler_client. - reconstruct_objects([obj_id], True)) + (ray.worker.global_worker.local_scheduler_client. 
+ fetch_or_reconstruct([obj_id], True)) self._fetching.append((worker, obj_id)) remaining = [] @@ -80,11 +80,12 @@ def split_colocated(actors): def try_create_colocated(cls, args, count): actors = [cls.remote(*args) for _ in range(count)] local, _ = split_colocated(actors) - print("Got {} colocated actors of {}".format(len(local), count)) + logger.info("Got {} colocated actors of {}".format(len(local), count)) return local def create_colocated(cls, args, count): + logger.info("Trying to create {} colocated actors".format(count)) ok = [] i = 1 while len(ok) < count and i < 10: diff --git a/python/ray/rllib/utils/annotations.py b/python/ray/rllib/utils/annotations.py new file mode 100644 index 0000000000000..d68f76a69600e --- /dev/null +++ b/python/ray/rllib/utils/annotations.py @@ -0,0 +1,20 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + + +def override(cls): + """Annotation for documenting method overrides. + + Arguments: + cls (type): The superclass that provides the overriden method. If this + cls does not actually have the method, an error is raised. + """ + + def check_override(method): + if method.__name__ not in dir(cls): + raise NameError("{} does not override any method of {}".format( + method, cls)) + return method + + return check_override diff --git a/python/ray/rllib/utils/compression.py b/python/ray/rllib/utils/compression.py index 5f28455ee44aa..aed0dd5985600 100644 --- a/python/ray/rllib/utils/compression.py +++ b/python/ray/rllib/utils/compression.py @@ -2,18 +2,21 @@ from __future__ import division from __future__ import print_function +import logging import time import base64 import numpy as np import pyarrow +logger = logging.getLogger(__name__) + try: import lz4.frame LZ4_ENABLED = True except ImportError: - print("WARNING: lz4 not available, disabling sample compression. " - "This will significantly impact RLlib performance. " - "To install lz4, run `pip install lz4`.") + logger.warn("lz4 not available, disabling sample compression. " + "This will significantly impact RLlib performance. " + "To install lz4, run `pip install lz4`.") LZ4_ENABLED = False diff --git a/python/ray/rllib/utils/filter.py b/python/ray/rllib/utils/filter.py index b2a3619481cdd..9a1f37dbd15a5 100644 --- a/python/ray/rllib/utils/filter.py +++ b/python/ray/rllib/utils/filter.py @@ -2,9 +2,12 @@ from __future__ import division from __future__ import print_function +import logging import numpy as np import threading +logger = logging.getLogger(__name__) + class Filter(object): """Processes input, possibly statefully.""" @@ -39,7 +42,10 @@ def __init__(self, *args): pass def __call__(self, x, update=True): - return np.asarray(x) + try: + return np.asarray(x) + except Exception: + raise ValueError("Failed to convert to array", x) def apply_changes(self, other, *args, **kwargs): pass @@ -74,8 +80,10 @@ def copy(self): def push(self, x): x = np.asarray(x) # Unvectorized update of the running statistics. 
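The new ray/rllib/utils/annotations.py above introduces an `override` decorator that documents an override and fails fast if the named superclass has no such method. A minimal usage sketch; the `Policy`/`RandomPolicy` classes are invented for illustration:

    from ray.rllib.utils.annotations import override


    class Policy(object):
        def compute_action(self, obs):
            raise NotImplementedError


    class RandomPolicy(Policy):
        @override(Policy)
        def compute_action(self, obs):
            # Documented override; if Policy had no compute_action attribute,
            # @override(Policy) would raise a NameError at class definition.
            return 0
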
- assert x.shape == self._M.shape, ("x.shape = {}, self.shape = {}" - .format(x.shape, self._M.shape)) + if x.shape != self._M.shape: + raise ValueError( + "Unexpected input shape {}, expected {}, value = {}".format( + x.shape, self._M.shape, x)) n1 = self._n self._n += 1 if self._n == 1: diff --git a/python/ray/rllib/utils/policy_client.py b/python/ray/rllib/utils/policy_client.py index 901dc983b0985..1bb4b5e134046 100644 --- a/python/ray/rllib/utils/policy_client.py +++ b/python/ray/rllib/utils/policy_client.py @@ -2,14 +2,17 @@ from __future__ import division from __future__ import print_function +import logging import pickle +logger = logging.getLogger(__name__) + try: import requests # `requests` is not part of stdlib. except ImportError: requests = None - print("Couldn't import `requests` library. Be sure to install it on" - " the client side.") + logger.warn("Couldn't import `requests` library. Be sure to install it on" + " the client side.") class PolicyClient(object): @@ -109,8 +112,7 @@ def _send(self, data): payload = pickle.dumps(data) response = requests.post(self._address, data=payload) if response.status_code != 200: - print("Request failed", data) - print(response.text) + logger.error("Request failed {}: {}".format(response.text, data)) response.raise_for_status() parsed = pickle.loads(response.content) return parsed diff --git a/python/ray/rllib/utils/policy_server.py b/python/ray/rllib/utils/policy_server.py index 13ca376bb82ab..25238971fd139 100644 --- a/python/ray/rllib/utils/policy_server.py +++ b/python/ray/rllib/utils/policy_server.py @@ -18,15 +18,15 @@ class PolicyServer(ThreadingMixIn, HTTPServer): - """REST server than can be launched from a ServingEnv. + """REST server than can be launched from a ExternalEnv. This launches a multi-threaded server that listens on the specified host and port to serve policy requests and forward experiences to RLlib. 
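The PolicyClient changes above switch failure reporting to the logger, and the PolicyServer it talks to is renamed below to use ExternalEnv terminology. A rough client-side loop implied by the command handlers (START_EPISODE, GET_ACTION, LOG_RETURNS, END_EPISODE); the address and the exact method signatures are assumptions, since only the server-side dispatch is shown in this diff:

    from ray.rllib.utils.policy_client import PolicyClient

    # Assumes a PolicyServer is already listening at this placeholder address.
    client = PolicyClient("http://localhost:9900")

    obs = [0.0, 0.0, 0.0, 0.0]  # placeholder observation
    episode_id = client.start_episode(training_enabled=True)
    action = client.get_action(episode_id, obs)
    client.log_returns(episode_id, 1.0)
    client.end_episode(episode_id, obs)
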
Examples: - >>> class CartpoleServing(ServingEnv): + >>> class CartpoleServing(ExternalEnv): def __init__(self): - ServingEnv.__init__( + ExternalEnv.__init__( self, spaces.Discrete(2), spaces.Box( low=-10, @@ -50,12 +50,12 @@ def run(self): >>> client.log_returns(eps_id, reward) """ - def __init__(self, serving_env, address, port): - handler = _make_handler(serving_env) + def __init__(self, external_env, address, port): + handler = _make_handler(external_env) HTTPServer.__init__(self, (address, port), handler) -def _make_handler(serving_env): +def _make_handler(external_env): class Handler(SimpleHTTPRequestHandler): def do_POST(self): content_len = int(self.headers.get('Content-Length'), 0) @@ -73,20 +73,20 @@ def execute_command(self, args): command = args["command"] response = {} if command == PolicyClient.START_EPISODE: - response["episode_id"] = serving_env.start_episode( + response["episode_id"] = external_env.start_episode( args["episode_id"], args["training_enabled"]) elif command == PolicyClient.GET_ACTION: - response["action"] = serving_env.get_action( + response["action"] = external_env.get_action( args["episode_id"], args["observation"]) elif command == PolicyClient.LOG_ACTION: - serving_env.log_action(args["episode_id"], args["observation"], - args["action"]) + external_env.log_action(args["episode_id"], + args["observation"], args["action"]) elif command == PolicyClient.LOG_RETURNS: - serving_env.log_returns(args["episode_id"], args["reward"], - args["info"]) + external_env.log_returns(args["episode_id"], args["reward"], + args["info"]) elif command == PolicyClient.END_EPISODE: - serving_env.end_episode(args["episode_id"], - args["observation"]) + external_env.end_episode(args["episode_id"], + args["observation"]) else: raise Exception("Unknown command: {}".format(command)) return response diff --git a/python/ray/rllib/utils/reshaper.py b/python/ray/rllib/utils/reshaper.py deleted file mode 100644 index e9c16521210c4..0000000000000 --- a/python/ray/rllib/utils/reshaper.py +++ /dev/null @@ -1,49 +0,0 @@ -import numpy as np -import tensorflow as tf - - -class Reshaper(object): - """ - This class keeps track of where in the flattened observation space - we should be slicing and what the new shapes should be - """ - - def __init__(self, env_space): - self.shapes = [] - self.slice_positions = [] - self.env_space = env_space - if isinstance(env_space, list): - for space in env_space: - # Handle both gym arrays and just lists of inputs length - if hasattr(space, "n"): - arr_shape = np.asarray([1]) # discrete space - elif hasattr(space, "shape"): - arr_shape = np.asarray(space.shape) - else: - arr_shape = space - self.shapes.append(arr_shape) - if len(self.slice_positions) == 0: - self.slice_positions.append(np.product(arr_shape)) - else: - self.slice_positions.append( - np.product(arr_shape) + self.slice_positions[-1]) - else: - self.shapes.append(np.asarray(env_space.shape)) - self.slice_positions.append(np.product(env_space.shape)) - - def get_slice_lengths(self): - diffed_list = np.diff(self.slice_positions).tolist() - diffed_list.insert(0, self.slice_positions[0]) - return np.asarray(diffed_list).astype(int) - - def split_tensor(self, tensor, axis=-1): - # FIXME (ev) This won't work for mixed action distributions like - # one agent Gaussian one agent discrete - slice_rescale = int(tensor.shape.as_list()[axis] / int( - np.sum(self.get_slice_lengths()))) - return tf.split( - tensor, slice_rescale * self.get_slice_lengths(), axis=axis) - - def split_number(self, number): - 
slice_rescale = int(number / int(np.sum(self.get_slice_lengths()))) - return slice_rescale * self.get_slice_lengths() diff --git a/python/ray/rllib/utils/tf_run_builder.py b/python/ray/rllib/utils/tf_run_builder.py index 030642ae5b6ae..4359c1b5e546f 100644 --- a/python/ray/rllib/utils/tf_run_builder.py +++ b/python/ray/rllib/utils/tf_run_builder.py @@ -2,12 +2,15 @@ from __future__ import division from __future__ import print_function +import logging import os import time import tensorflow as tf from tensorflow.python.client import timeline +logger = logging.getLogger(__name__) + class TFRunBuilder(object): """Used to incrementally build up a TensorFlow run. @@ -26,7 +29,8 @@ def __init__(self, session, debug_name): def add_feed_dict(self, feed_dict): assert not self._executed for k in feed_dict: - assert k not in self.feed_dict + if k in self.feed_dict: + raise ValueError("Key added twice: {}".format(k)) self.feed_dict.update(feed_dict) def add_fetches(self, fetches): @@ -41,10 +45,9 @@ def get(self, to_fetch): self._executed = run_timeline( self.session, self.fetches, self.debug_name, self.feed_dict, os.environ.get("TF_TIMELINE_DIR")) - except Exception as e: - print("Error fetching: {}, feed_dict={}".format( + except Exception: + raise ValueError("Error fetching: {}, feed_dict={}".format( self.fetches, self.feed_dict)) - raise e if isinstance(to_fetch, int): return self._executed[to_fetch] elif isinstance(to_fetch, list): @@ -75,8 +78,8 @@ def run_timeline(sess, ops, debug_name, feed_dict={}, timeline_dir=None): debug_name, os.getpid(), _count)) _count += 1 trace_file = open(outf, "w") - print("Wrote tf timeline ({} s) to {}".format(time.time() - start, - os.path.abspath(outf))) + logger.info("Wrote tf timeline ({} s) to {}".format( + time.time() - start, os.path.abspath(outf))) trace_file.write(trace.generate_chrome_trace_format()) else: fetches = sess.run(ops, feed_dict=feed_dict) diff --git a/python/ray/scripts/scripts.py b/python/ray/scripts/scripts.py index 0826a1387aec8..b84db6757c86a 100644 --- a/python/ray/scripts/scripts.py +++ b/python/ray/scripts/scripts.py @@ -20,7 +20,7 @@ def check_no_existing_redis_clients(node_ip_address, redis_client): # The client table prefix must be kept in sync with the file - # "src/common/redis_module/ray_redis_module.cc" where it is defined. + # "src/ray/gcs/redis_module/ray_redis_module.cc" where it is defined. REDIS_CLIENT_TABLE_PREFIX = "CL:" client_keys = redis_client.keys("{}*".format(REDIS_CLIENT_TABLE_PREFIX)) # Filter to clients on the same node and do some basic checking. @@ -89,6 +89,11 @@ def cli(logging_level, logging_format): type=int, help=("If provided, attempt to configure Redis with this " "maximum number of clients.")) +@click.option( + "--redis-password", + required=False, + type=str, + help="If provided, secure Redis ports with this password") @click.option( "--redis-shard-ports", required=False, @@ -100,12 +105,33 @@ def cli(logging_level, logging_format): required=False, type=int, help="the port to use for starting the object manager") +@click.option( + "--node-manager-port", + required=False, + type=int, + help="the port to use for starting the node manager") @click.option( "--object-store-memory", required=False, type=int, help="the maximum amount of memory (in bytes) to allow the " "object store to use") +@click.option( + "--redis-max-memory", + required=False, + type=int, + help=("The max amount of memory (in bytes) to allow redis to use, or None " + "for no limit. 
Once the limit is exceeded, redis will start LRU " + "eviction of entries. This only applies to the sharded " + "redis tables (task and object tables).")) +@click.option( + "--collect-profiling-data", + default=True, + type=bool, + help=("Whether to collect profiling data. Note that " + "profiling data cannot be LRU evicted, so if you set " + "redis_max_memory then profiling will also be disabled to prevent " + "it from consuming all available redis memory.")) @click.option( "--num-workers", required=False, @@ -162,11 +188,6 @@ def cli(logging_level, logging_format): required=False, type=str, help="the file that contains the autoscaling config") -@click.option( - "--use-raylet", - is_flag=True, - default=None, - help="use the raylet code path") @click.option( "--no-redirect-worker-output", is_flag=True, @@ -177,25 +198,40 @@ def cli(logging_level, logging_format): is_flag=True, default=False, help="do not redirect non-worker stdout and stderr to files") +@click.option( + "--plasma-store-socket-name", + default=None, + help="manually specify the socket name of the plasma store") +@click.option( + "--raylet-socket-name", + default=None, + help="manually specify the socket path of the raylet process") +@click.option( + "--temp-dir", + default=None, + help="manually specify the root temporary dir of the Ray process") +@click.option( + "--internal-config", + default=None, + type=str, + help="Do NOT use this. This is for debugging/development purposes ONLY.") def start(node_ip_address, redis_address, redis_port, num_redis_shards, - redis_max_clients, redis_shard_ports, object_manager_port, - object_store_memory, num_workers, num_cpus, num_gpus, resources, - head, no_ui, block, plasma_directory, huge_pages, autoscaling_config, - use_raylet, no_redirect_worker_output, no_redirect_output): + redis_max_clients, redis_password, redis_shard_ports, + object_manager_port, node_manager_port, object_store_memory, + redis_max_memory, collect_profiling_data, num_workers, num_cpus, + num_gpus, resources, head, no_ui, block, plasma_directory, + huge_pages, autoscaling_config, no_redirect_worker_output, + no_redirect_output, plasma_store_socket_name, raylet_socket_name, + temp_dir, internal_config): # Convert hostnames to numerical IP address. if node_ip_address is not None: node_ip_address = services.address_to_ip(node_ip_address) if redis_address is not None: redis_address = services.address_to_ip(redis_address) - if use_raylet is None and os.environ.get("RAY_USE_XRAY") == "1": - # This environment variable is used in our testing setup. - logger.info("Detected environment variable 'RAY_USE_XRAY'.") - use_raylet = True - try: resources = json.loads(resources) - except Exception as e: + except Exception: raise Exception("Unable to parse the --resources argument using " "json.loads. Try using a format like\n\n" " --resources='{\"CustomResource1\": 3, " @@ -235,19 +271,15 @@ def start(node_ip_address, redis_address, redis_port, num_redis_shards, logger.info("Using IP address {} for this node." .format(node_ip_address)) - address_info = {} - # Use the provided object manager port if there is one. 
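A little earlier in this diff, TFRunBuilder stopped printing fetch errors (it now raises a ValueError) and reports duplicate feed keys explicitly. A sketch of how the builder is typically driven, assuming `add_fetches` returns indices that can later be passed to `get()`, which the `get()` code suggests but this diff does not show:

    import tensorflow as tf

    from ray.rllib.utils.tf_run_builder import TFRunBuilder

    # Toy TF1-style graph; the tensors are illustrative only.
    x = tf.placeholder(tf.float32, shape=())
    y = x * 2.0

    with tf.Session() as sess:
        builder = TFRunBuilder(sess, "toy_example")
        builder.add_feed_dict({x: 3.0})
        # Feeding the same placeholder twice would now raise
        # ValueError("Key added twice: ...") instead of failing a bare assert.
        fetch_ids = builder.add_fetches([y])
        print(builder.get(fetch_ids))  # the session only runs here, lazily
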
- if object_manager_port is not None: - address_info["object_manager_ports"] = [object_manager_port] - if address_info == {}: - address_info = None - address_info = services.start_ray_head( - address_info=address_info, + object_manager_ports=[object_manager_port], + node_manager_ports=[node_manager_port], node_ip_address=node_ip_address, redis_port=redis_port, redis_shard_ports=redis_shard_ports, object_store_memory=object_store_memory, + redis_max_memory=redis_max_memory, + collect_profiling_data=collect_profiling_data, num_workers=num_workers, cleanup=False, redirect_worker_output=not no_redirect_worker_output, @@ -255,26 +287,33 @@ def start(node_ip_address, redis_address, redis_port, num_redis_shards, resources=resources, num_redis_shards=num_redis_shards, redis_max_clients=redis_max_clients, - redis_protected_mode=False, + redis_password=redis_password, include_webui=(not no_ui), plasma_directory=plasma_directory, huge_pages=huge_pages, autoscaling_config=autoscaling_config, - use_raylet=use_raylet) + plasma_store_socket_name=plasma_store_socket_name, + raylet_socket_name=raylet_socket_name, + temp_dir=temp_dir, + _internal_config=internal_config) logger.info(address_info) logger.info( "\nStarted Ray on this node. You can add additional nodes to " "the cluster by calling\n\n" - " ray start --redis-address {}\n\n" + " ray start --redis-address {}{}{}\n\n" "from the node you wish to add. You can connect a driver to the " "cluster from Python by running\n\n" " import ray\n" - " ray.init(redis_address=\"{}\")\n\n" + " ray.init(redis_address=\"{}{}{}\")\n\n" "If you have trouble connecting from a different machine, check " "that your firewall is configured properly. If you wish to " "terminate the processes that have been started, run\n\n" - " ray stop".format(address_info["redis_address"], - address_info["redis_address"])) + " ray stop".format( + address_info["redis_address"], " --redis-password " + if redis_password else "", redis_password if redis_password + else "", address_info["redis_address"], "\", redis_password=\"" + if redis_password else "", redis_password + if redis_password else "")) else: # Start Ray on a non-head node. if redis_port is not None: @@ -299,10 +338,12 @@ def start(node_ip_address, redis_address, redis_port, num_redis_shards, # Wait for the Redis server to be started. And throw an exception if we # can't connect to it. - services.wait_for_redis_to_start(redis_ip_address, int(redis_port)) + services.wait_for_redis_to_start( + redis_ip_address, int(redis_port), password=redis_password) # Create a Redis client. - redis_client = services.create_redis_client(redis_address) + redis_client = services.create_redis_client( + redis_address, password=redis_password) # Check that the verion information on this node matches the version # information that the cluster was started with. 
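With the new `--redis-password` option, the head-node startup message above tells users to pass the password to `ray.init` as well. Based on that hint, a driver connects roughly like this (address and password are placeholders):

    import ray

    # Matches the hint printed by `ray start --head --redis-password <pw>`;
    # both values below stand in for the ones printed on your head node.
    ray.init(
        redis_address="192.168.0.10:6379",
        redis_password="my-cluster-password")
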
@@ -321,15 +362,20 @@ def start(node_ip_address, redis_address, redis_port, num_redis_shards, node_ip_address=node_ip_address, redis_address=redis_address, object_manager_ports=[object_manager_port], + node_manager_ports=[node_manager_port], num_workers=num_workers, object_store_memory=object_store_memory, + redis_password=redis_password, cleanup=False, redirect_worker_output=not no_redirect_worker_output, redirect_output=not no_redirect_output, resources=resources, plasma_directory=plasma_directory, huge_pages=huge_pages, - use_raylet=use_raylet) + plasma_store_socket_name=plasma_store_socket_name, + raylet_socket_name=raylet_socket_name, + temp_dir=temp_dir, + _internal_config=internal_config) logger.info(address_info) logger.info("\nStarted Ray on this node. If you wish to terminate the " "processes that have been started, run\n\n" @@ -344,11 +390,7 @@ def start(node_ip_address, redis_address, redis_port, num_redis_shards, @cli.command() def stop(): subprocess.call( - [ - "killall global_scheduler plasma_store_server plasma_manager " - "local_scheduler raylet raylet_monitor" - ], - shell=True) + ["killall plasma_store_server raylet raylet_monitor"], shell=True) # Find the PID of the monitor process and kill it. subprocess.call( @@ -373,6 +415,12 @@ def stop(): "grep -v grep | awk '{ print $2 }') 2> /dev/null" ], shell=True) + subprocess.call( + [ + "kill -9 $(ps aux | grep ' ray_' | " + "grep -v grep | awk '{ print $2 }') 2> /dev/null" + ], + shell=True) # Find the PID of the Ray log monitor process and kill it. subprocess.call( @@ -387,10 +435,10 @@ def stop(): from notebook.notebookapp import list_running_servers pids = [ str(server["pid"]) for server in list_running_servers() - if "/tmp/raylogs" in server["notebook_dir"] + if "/tmp/ray" in server["notebook_dir"] ] subprocess.call( - ["kill {} 2> /dev/null".format(" ".join(pids))], shell=True) + ["kill -9 {} 2> /dev/null".format(" ".join(pids))], shell=True) except ImportError: pass @@ -413,24 +461,24 @@ def stop(): "--min-workers", required=False, type=int, - help=("Override the configured min worker node count for the cluster.")) + help="Override the configured min worker node count for the cluster.") @click.option( "--max-workers", required=False, type=int, - help=("Override the configured max worker node count for the cluster.")) + help="Override the configured max worker node count for the cluster.") @click.option( "--cluster-name", "-n", required=False, type=str, - help=("Override the configured cluster name.")) + help="Override the configured cluster name.") @click.option( "--yes", "-y", is_flag=True, default=False, - help=("Don't ask for confirmation.")) + help="Don't ask for confirmation.") def create_or_update(cluster_config_file, min_workers, max_workers, no_restart, restart_only, yes, cluster_name): if restart_only or no_restart: @@ -446,19 +494,19 @@ def create_or_update(cluster_config_file, min_workers, max_workers, no_restart, "--workers-only", is_flag=True, default=False, - help=("Only destroy the workers.")) + help="Only destroy the workers.") @click.option( "--yes", "-y", is_flag=True, default=False, - help=("Don't ask for confirmation.")) + help="Don't ask for confirmation.") @click.option( "--cluster-name", "-n", required=False, type=str, - help=("Override the configured cluster name.")) + help="Override the configured cluster name.") def teardown(cluster_config_file, yes, workers_only, cluster_name): teardown_cluster(cluster_config_file, yes, workers_only, cluster_name) @@ -469,17 +517,17 @@ def 
teardown(cluster_config_file, yes, workers_only, cluster_name): "--start", is_flag=True, default=False, - help=("Start the cluster if needed.")) + help="Start the cluster if needed.") @click.option( - "--tmux", is_flag=True, default=False, help=("Run the command in tmux.")) + "--tmux", is_flag=True, default=False, help="Run the command in tmux.") @click.option( "--cluster-name", "-n", required=False, type=str, - help=("Override the configured cluster name.")) + help="Override the configured cluster name.") @click.option( - "--new", "-N", is_flag=True, help=("Force creation of a new screen.")) + "--new", "-N", is_flag=True, help="Force creation of a new screen.") def attach(cluster_config_file, start, tmux, cluster_name, new): attach_cluster(cluster_config_file, start, tmux, cluster_name, new) @@ -493,7 +541,7 @@ def attach(cluster_config_file, start, tmux, cluster_name, new): "-n", required=False, type=str, - help=("Override the configured cluster name.")) + help="Override the configured cluster name.") def rsync_down(cluster_config_file, source, target, cluster_name): rsync(cluster_config_file, source, target, cluster_name, down=True) @@ -507,11 +555,77 @@ def rsync_down(cluster_config_file, source, target, cluster_name): "-n", required=False, type=str, - help=("Override the configured cluster name.")) + help="Override the configured cluster name.") def rsync_up(cluster_config_file, source, target, cluster_name): rsync(cluster_config_file, source, target, cluster_name, down=False) +@cli.command() +@click.argument("cluster_config_file", required=True, type=str) +@click.option( + "--stop", + is_flag=True, + default=False, + help="Stop the cluster after the command finishes running.") +@click.option( + "--start", + is_flag=True, + default=False, + help="Start the cluster if needed.") +@click.option( + "--screen", + is_flag=True, + default=False, + help="Run the command in a screen.") +@click.option( + "--tmux", is_flag=True, default=False, help="Run the command in tmux.") +@click.option( + "--cluster-name", + "-n", + required=False, + type=str, + help="Override the configured cluster name.") +@click.option( + "--port-forward", required=False, type=int, help="Port to forward.") +@click.argument("script", required=True, type=str) +@click.argument("script_args", required=False, type=str, nargs=-1) +def submit(cluster_config_file, screen, tmux, stop, start, cluster_name, + port_forward, script, script_args): + """Uploads and runs a script on the specified cluster. + + The script is automatically synced to the following location: + + os.path.join("~", os.path.basename(script)) + """ + assert not (screen and tmux), "Can specify only one of `screen` or `tmux`." 
+ + if start: + create_or_update_cluster(cluster_config_file, None, None, False, False, + True, cluster_name) + + target = os.path.join("~", os.path.basename(script)) + rsync(cluster_config_file, script, target, cluster_name, down=False) + + cmd = " ".join(["python", target] + list(script_args)) + exec_cluster(cluster_config_file, cmd, screen, tmux, stop, False, + cluster_name, port_forward) + + if tmux or screen: + attach_command_parts = ["ray attach", cluster_config_file] + if cluster_name is not None: + attach_command_parts.append( + "--cluster-name={}".format(cluster_name)) + if tmux: + attach_command_parts.append("--tmux") + elif screen: + attach_command_parts.append("--screen") + + attach_command = " ".join(attach_command_parts) + attach_info = "Use `{}` to check on command status.".format( + attach_command) + logger.info(attach_info) + + @cli.command() @click.argument("cluster_config_file", required=True, type=str) @click.argument("cmd", required=True, type=str) @@ -519,35 +633,48 @@ def rsync_up(cluster_config_file, source, target, cluster_name): "--stop", is_flag=True, default=False, - help=("Stop the cluster after the command finishes running.")) + help="Stop the cluster after the command finishes running.") @click.option( "--start", is_flag=True, default=False, - help=("Start the cluster if needed.")) + help="Start the cluster if needed.") @click.option( "--screen", is_flag=True, default=False, - help=("Run the command in a screen.")) + help="Run the command in a screen.") @click.option( - "--tmux", is_flag=True, default=False, help=("Run the command in tmux.")) + "--tmux", is_flag=True, default=False, help="Run the command in tmux.") @click.option( "--cluster-name", "-n", required=False, type=str, - help=("Override the configured cluster name.")) + help="Override the configured cluster name.") @click.option( - "--port-forward", required=False, type=int, help=("Port to forward.")) + "--port-forward", required=False, type=int, help="Port to forward.") def exec_cmd(cluster_config_file, cmd, screen, tmux, stop, start, cluster_name, port_forward): assert not (screen and tmux), "Can specify only one of `screen` or `tmux`." + exec_cluster(cluster_config_file, cmd, screen, tmux, stop, start, cluster_name, port_forward) - if tmux: - logger.info("Use `ray attach {} --tmux` " - "to check on command status.".format(cluster_config_file)) + + if tmux or screen: + attach_command_parts = ["ray attach", cluster_config_file] + if cluster_name is not None: + attach_command_parts.append( + "--cluster-name={}".format(cluster_name)) + if tmux: + attach_command_parts.append("--tmux") + elif screen: + attach_command_parts.append("--screen") + + attach_command = " ".join(attach_command_parts) + attach_info = "Use `{}` to check on command status.".format( + attach_command) + logger.info(attach_info) @cli.command() @@ -557,22 +684,49 @@ def exec_cmd(cluster_config_file, cmd, screen, tmux, stop, start, cluster_name, "-n", required=False, type=str, - help=("Override the configured cluster name.")) + help="Override the configured cluster name.") def get_head_ip(cluster_config_file, cluster_name): click.echo(get_head_node_ip(cluster_config_file, cluster_name)) +@cli.command() +def stack(): + COMMAND = """ +pyspy=`which py-spy` +if [ ! -e "$pyspy" ]; then + echo "ERROR: Please 'pip install py-spy' (or ray[debug]) first" + exit 1 +fi +# Set IFS to iterate over lines instead of over words. +export IFS=" +" +# Call sudo to prompt for password before anything has been printed. 
+sudo true +workers=$( + ps aux | grep ' ray_' | grep -v grep +) +for worker in $workers; do + echo "Stack dump for $worker"; + pid=`echo $worker | awk '{print $2}'`; + sudo $pyspy --pid $pid --dump; + echo; +done + """ + subprocess.call(COMMAND, shell=True) + + cli.add_command(start) cli.add_command(stop) -cli.add_command(create_or_update) cli.add_command(create_or_update, name="up") cli.add_command(attach) cli.add_command(exec_cmd, name="exec") -cli.add_command(rsync_down) -cli.add_command(rsync_up) +cli.add_command(rsync_down, name="rsync_down") +cli.add_command(rsync_up, name="rsync_up") +cli.add_command(submit) cli.add_command(teardown) cli.add_command(teardown, name="down") -cli.add_command(get_head_ip) +cli.add_command(get_head_ip, name="get_head_ip") +cli.add_command(stack) def main(): diff --git a/python/ray/services.py b/python/ray/services.py index 3a421437c5664..e96196b5f9463 100644 --- a/python/ray/services.py +++ b/python/ray/services.py @@ -2,43 +2,43 @@ from __future__ import division from __future__ import print_function -import binascii import json import logging import multiprocessing import os import random import resource -import shutil import signal import socket import subprocess import sys import threading import time -from collections import OrderedDict, namedtuple -from datetime import datetime - +from collections import OrderedDict import redis import pyarrow # Ray modules import ray.ray_constants -import ray.global_scheduler as global_scheduler -import ray.local_scheduler import ray.plasma +from ray.tempfile_services import ( + get_ipython_notebook_path, get_logs_dir_path, get_raylet_socket_name, + get_temp_root, new_log_monitor_log_file, new_monitor_log_file, + new_plasma_store_log_file, new_raylet_log_file, new_redis_log_file, + new_webui_log_file, set_temp_root) + PROCESS_TYPE_MONITOR = "monitor" PROCESS_TYPE_LOG_MONITOR = "log_monitor" PROCESS_TYPE_WORKER = "worker" PROCESS_TYPE_RAYLET = "raylet" -PROCESS_TYPE_LOCAL_SCHEDULER = "local_scheduler" -PROCESS_TYPE_PLASMA_MANAGER = "plasma_manager" PROCESS_TYPE_PLASMA_STORE = "plasma_store" -PROCESS_TYPE_GLOBAL_SCHEDULER = "global_scheduler" PROCESS_TYPE_REDIS_SERVER = "redis_server" PROCESS_TYPE_WEB_UI = "web_ui" +# Max bytes to allocate to plasma unless overriden by the user +MAX_DEFAULT_MEM = 20 * 1000 * 1000 * 1000 + # This is a dictionary tracking all of the processes of different types that # have been started by this services module. Note that the order of the keys is # important because it determines the order in which these processes will be @@ -47,23 +47,20 @@ all_processes = OrderedDict( [(PROCESS_TYPE_MONITOR, []), (PROCESS_TYPE_LOG_MONITOR, []), (PROCESS_TYPE_WORKER, []), (PROCESS_TYPE_RAYLET, []), - (PROCESS_TYPE_LOCAL_SCHEDULER, []), (PROCESS_TYPE_PLASMA_MANAGER, []), - (PROCESS_TYPE_PLASMA_STORE, []), (PROCESS_TYPE_GLOBAL_SCHEDULER, []), - (PROCESS_TYPE_REDIS_SERVER, []), (PROCESS_TYPE_WEB_UI, [])], ) + (PROCESS_TYPE_PLASMA_STORE, []), (PROCESS_TYPE_REDIS_SERVER, []), + (PROCESS_TYPE_WEB_UI, [])], ) # True if processes are run in the valgrind profiler. RUN_RAYLET_PROFILER = False -RUN_LOCAL_SCHEDULER_PROFILER = False -RUN_PLASMA_MANAGER_PROFILER = False RUN_PLASMA_STORE_PROFILER = False # Location of the redis server and module. 
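The `ray submit` command registered above is a thin wrapper: it rsyncs the script to the head node and then runs `python <script>` there via `exec_cluster`. A rough Python equivalent of that flow, assuming the helpers it calls live in `ray.autoscaler.commands` as elsewhere in scripts.py; the file names are placeholders:

    import os

    from ray.autoscaler.commands import exec_cluster, rsync

    cluster_config_file = "cluster.yaml"   # placeholder
    script = "my_script.py"                # placeholder

    # Mirror submit(): upload the script, then run it on the head node.
    target = os.path.join("~", os.path.basename(script))
    rsync(cluster_config_file, script, target, None, down=False)
    exec_cluster(cluster_config_file, "python " + target,
                 False, False, False, False, None, None)
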
REDIS_EXECUTABLE = os.path.join( os.path.abspath(os.path.dirname(__file__)), - "core/src/common/thirdparty/redis/src/redis-server") + "core/src/ray/thirdparty/redis/src/redis-server") REDIS_MODULE = os.path.join( os.path.abspath(os.path.dirname(__file__)), - "core/src/common/redis_module/libray_redis_module.so") + "core/src/ray/gcs/redis_module/libray_redis_module.so") # Location of the credis server and modules. # credis will be enabled if the environment variable RAY_USE_NEW_GCS is set. @@ -84,14 +81,6 @@ RAYLET_EXECUTABLE = os.path.join( os.path.abspath(os.path.dirname(__file__)), "core/src/ray/raylet/raylet") -# ObjectStoreAddress tuples contain all information necessary to connect to an -# object store. The fields are: -# - name: The socket name for the object store -# - manager_name: The socket name for the object store manager -# - manager_port: The Internet port that the object store manager listens on -ObjectStoreAddress = namedtuple("ObjectStoreAddress", - ["name", "manager_name", "manager_port"]) - # Logger for this module. It should be configured at the entry point # into the program using Ray. Ray configures it by default automatically # using logging.basicConfig in its entry/init points. @@ -120,10 +109,6 @@ def new_port(): return random.randint(10000, 65535) -def random_name(): - return str(random.randint(0, 99999999)) - - def kill_process(p): """Kill a process. @@ -136,10 +121,7 @@ def kill_process(p): if p.poll() is not None: # The process has already terminated. return True - if any([ - RUN_RAYLET_PROFILER, RUN_LOCAL_SCHEDULER_PROFILER, - RUN_PLASMA_MANAGER_PROFILER, RUN_PLASMA_STORE_PROFILER - ]): + if any([RUN_RAYLET_PROFILER, RUN_PLASMA_STORE_PROFILER]): # Give process signal to write profiler data. os.kill(p.pid, signal.SIGINT) # Wait for profiling data to be written. @@ -187,18 +169,21 @@ def cleanup(): logger.warning("Ray did not shut down properly.") -def all_processes_alive(exclude=[]): +def all_processes_alive(exclude=None): """Check if all of the processes are still alive. Args: exclude: Don't check the processes whose types are in this list. """ + + if exclude is None: + exclude = [] for process_type, processes in all_processes.items(): # Note that p.poll() returns the exit code that the process exited # with, so an exit code of None indicates that the process is still # alive. processes_alive = [p.poll() is None for p in processes] - if (not all(processes_alive) and process_type not in exclude): + if not all(processes_alive) and process_type not in exclude: logger.warning( "A process of type {} has died.".format(process_type)) return False @@ -258,7 +243,10 @@ def get_node_ip_address(address="8.8.8.8:53"): return node_ip_address -def record_log_files_in_redis(redis_address, node_ip_address, log_files): +def record_log_files_in_redis(redis_address, + node_ip_address, + log_files, + password=None): """Record in Redis that a new log file has been created. This is used so that each log monitor can check Redis and figure out which @@ -270,23 +258,24 @@ def record_log_files_in_redis(redis_address, node_ip_address, log_files): on. log_files: A list of file handles for the log files. If one of the file handles is None, we ignore it. + password (str): The password of the redis server. 
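The `all_processes_alive()` change above swaps a mutable default argument (`exclude=[]`) for `None`. The usual motivation is that a list default is created once at definition time and shared across calls, so any mutation leaks into later calls; a self-contained illustration with made-up function names:

    def buggy(exclude=[]):
        exclude.append("x")      # mutates the single shared default list
        return list(exclude)

    def fixed(exclude=None):
        if exclude is None:
            exclude = []         # fresh list on every call
        exclude.append("x")
        return exclude

    assert buggy() == ["x"]
    assert buggy() == ["x", "x"]  # state leaked in from the first call
    assert fixed() == ["x"]
    assert fixed() == ["x"]
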
""" for log_file in log_files: if log_file is not None: redis_ip_address, redis_port = redis_address.split(":") redis_client = redis.StrictRedis( - host=redis_ip_address, port=redis_port) + host=redis_ip_address, port=redis_port, password=password) # The name of the key storing the list of log filenames for this IP # address. log_file_list_key = "LOG_FILENAMES:{}".format(node_ip_address) redis_client.rpush(log_file_list_key, log_file.name) -def create_redis_client(redis_address): +def create_redis_client(redis_address, password=None): """Create a Redis client. Args: - The IP address and port of the Redis server. + The IP address, port, and password of the Redis server. Returns: A Redis client. @@ -294,10 +283,14 @@ def create_redis_client(redis_address): redis_ip_address, redis_port = redis_address.split(":") # For this command to work, some other client (on the same machine # as Redis) must have run "CONFIG SET protected-mode no". - return redis.StrictRedis(host=redis_ip_address, port=int(redis_port)) + return redis.StrictRedis( + host=redis_ip_address, port=int(redis_port), password=password) -def wait_for_redis_to_start(redis_ip_address, redis_port, num_retries=5): +def wait_for_redis_to_start(redis_ip_address, + redis_port, + password=None, + num_retries=5): """Wait for a Redis server to be available. This is accomplished by creating a Redis client and sending a random @@ -306,13 +299,15 @@ def wait_for_redis_to_start(redis_ip_address, redis_port, num_retries=5): Args: redis_ip_address (str): The IP address of the redis server. redis_port (int): The port of the redis server. + password (str): The password of the redis server. num_retries (int): The number of times to try connecting with redis. The client will sleep for one second between attempts. Raises: Exception: An exception is raised if we could not connect with Redis. """ - redis_client = redis.StrictRedis(host=redis_ip_address, port=redis_port) + redis_client = redis.StrictRedis( + host=redis_ip_address, port=redis_port, password=password) # Wait for the Redis server to start. counter = 0 while counter < num_retries: @@ -322,7 +317,7 @@ def wait_for_redis_to_start(redis_ip_address, redis_port, num_retries=5): "Waiting for redis server at {}:{} to respond...".format( redis_ip_address, redis_port)) redis_client.client_list() - except redis.ConnectionError as e: + except redis.ConnectionError: # Wait a little bit. time.sleep(1) logger.info("Failed to connect to the redis server, retrying.") @@ -358,7 +353,7 @@ def _compute_version_info(): ray_version = ray.__version__ python_version = ".".join(map(str, sys.version_info[:3])) pyarrow_version = pyarrow.__version__ - return (ray_version, python_version, pyarrow_version) + return ray_version, python_version, pyarrow_version def _put_version_info_in_redis(redis_client): @@ -417,12 +412,12 @@ def start_redis(node_ip_address, redis_shard_ports=None, num_redis_shards=1, redis_max_clients=None, - use_raylet=False, redirect_output=False, redirect_worker_output=False, cleanup=True, - protected_mode=False, - use_credis=None): + password=None, + use_credis=None, + redis_max_memory=None): """Start the Redis global state store. Args: @@ -437,8 +432,6 @@ def start_redis(node_ip_address, shard. redis_max_clients: If this is provided, Ray will attempt to configure Redis with this maxclients number. - use_raylet: True if the new raylet code path should be used. This is - not supported yet. redirect_output (bool): True if output should be redirected to a file and false otherwise. 
redirect_worker_output (bool): True if worker output should be @@ -448,16 +441,21 @@ def start_redis(node_ip_address, then all Redis processes started by this method will be killed by services.cleanup() when the Python process that imported services exits. + password (str): Prevents external clients without the password + from connecting to Redis if provided. use_credis: If True, additionally load the chain-replicated libraries into the redis servers. Defaults to None, which means its value is set by the presence of "RAY_USE_NEW_GCS" in os.environ. + redis_max_memory: The max amount of memory (in bytes) to allow redis + to use, or None for no limit. Once the limit is exceeded, redis + will start LRU eviction of entries. This only applies to the + sharded redis tables (task and object tables). Returns: A tuple of the address for the primary Redis shard and a list of addresses for the remaining shards. """ - redis_stdout_file, redis_stderr_file = new_log_files( - "redis", redirect_output) + redis_stdout_file, redis_stderr_file = new_redis_log_file(redirect_output) if redis_shard_ports is None: redis_shard_ports = num_redis_shards * [None] @@ -467,6 +465,13 @@ def start_redis(node_ip_address, if use_credis is None: use_credis = ("RAY_USE_NEW_GCS" in os.environ) + if use_credis and password is not None: + # TODO(pschafhalter) remove this once credis supports + # authenticating Redis ports + raise Exception("Setting the `redis_password` argument is not " + "supported in credis. To run Ray with " + "password-protected Redis ports, ensure that " + "the environment variable `RAY_USE_NEW_GCS=off`.") if not use_credis: assigned_port, _ = _start_redis_instance( node_ip_address=node_ip_address, @@ -475,7 +480,8 @@ def start_redis(node_ip_address, stdout_file=redis_stdout_file, stderr_file=redis_stderr_file, cleanup=cleanup, - protected_mode=protected_mode) + password=password, + redis_max_memory=None) else: assigned_port, _ = _start_redis_instance( node_ip_address=node_ip_address, @@ -484,25 +490,22 @@ def start_redis(node_ip_address, stdout_file=redis_stdout_file, stderr_file=redis_stderr_file, cleanup=cleanup, - protected_mode=protected_mode, executable=CREDIS_EXECUTABLE, # It is important to load the credis module BEFORE the ray module, # as the latter contains an extern declaration that the former # supplies. - modules=[CREDIS_MASTER_MODULE, REDIS_MODULE]) + modules=[CREDIS_MASTER_MODULE, REDIS_MODULE], + password=password, + redis_max_memory=None) if port is not None: assert assigned_port == port port = assigned_port redis_address = address(node_ip_address, port) - redis_client = redis.StrictRedis(host=node_ip_address, port=port) - - # Store whether we're using the raylet code path or not. - redis_client.set("UseRaylet", 1 if use_raylet else 0) - # Register the number of Redis shards in the primary shard, so that clients # know how many redis shards to expect under RedisShards. - primary_redis_client = redis.StrictRedis(host=node_ip_address, port=port) + primary_redis_client = redis.StrictRedis( + host=node_ip_address, port=port, password=password) primary_redis_client.set("NumRedisShards", str(num_redis_shards)) # Put the redirect_worker_output bool in the Redis shard so that workers @@ -517,8 +520,8 @@ def start_redis(node_ip_address, # prefixed by "redis-". 
redis_shards = [] for i in range(num_redis_shards): - redis_stdout_file, redis_stderr_file = new_log_files( - "redis-{}".format(i), redirect_output) + redis_stdout_file, redis_stderr_file = new_redis_log_file( + redirect_output, shard_number=i) if not use_credis: redis_shard_port, _ = _start_redis_instance( node_ip_address=node_ip_address, @@ -527,7 +530,8 @@ def start_redis(node_ip_address, stdout_file=redis_stdout_file, stderr_file=redis_stderr_file, cleanup=cleanup, - protected_mode=protected_mode) + password=password, + redis_max_memory=redis_max_memory) else: assert num_redis_shards == 1, \ "For now, RAY_USE_NEW_GCS supports 1 shard, and credis "\ @@ -539,12 +543,13 @@ def start_redis(node_ip_address, stdout_file=redis_stdout_file, stderr_file=redis_stderr_file, cleanup=cleanup, - protected_mode=protected_mode, + password=password, executable=CREDIS_EXECUTABLE, # It is important to load the credis module BEFORE the ray # module, as the latter contains an extern declaration that the # former supplies. - modules=[CREDIS_MEMBER_MODULE, REDIS_MODULE]) + modules=[CREDIS_MEMBER_MODULE, REDIS_MODULE], + redis_max_memory=redis_max_memory) if redis_shard_ports[i] is not None: assert redis_shard_port == redis_shard_ports[i] @@ -555,7 +560,7 @@ def start_redis(node_ip_address, if use_credis: shard_client = redis.StrictRedis( - host=node_ip_address, port=redis_shard_port) + host=node_ip_address, port=redis_shard_port, password=password) # Configure the chain state. primary_redis_client.execute_command("MASTER.ADD", node_ip_address, redis_shard_port) @@ -565,22 +570,6 @@ def start_redis(node_ip_address, return redis_address, redis_shards -def _make_temp_redis_config(node_ip_address): - """Create a configuration file for Redis. - - Args: - node_ip_address: The IP address of this node. This should not be - 127.0.0.1. - """ - redis_config_name = "/tmp/redis_conf{}".format(random_name()) - with open(redis_config_name, 'w') as f: - # This allows redis clients on the same machine to connect using the - # node's IP address as opposed to just 127.0.0.1. This is only relevant - # when the server is in protected mode. - f.write("bind 127.0.0.1 {}".format(node_ip_address)) - return redis_config_name - - def _start_redis_instance(node_ip_address="127.0.0.1", port=None, redis_max_clients=None, @@ -588,9 +577,10 @@ def _start_redis_instance(node_ip_address="127.0.0.1", stdout_file=None, stderr_file=None, cleanup=True, - protected_mode=False, + password=None, executable=REDIS_EXECUTABLE, - modules=None): + modules=None, + redis_max_memory=None): """Start a single Redis server. Args: @@ -608,14 +598,15 @@ def _start_redis_instance(node_ip_address="127.0.0.1", cleanup (bool): True if using Ray in local mode. If cleanup is true, then this process will be killed by serices.cleanup() when the Python process that imported services exits. - protected_mode: True if we should start the Redis server in protected - mode. This will prevent clients on other machines from connecting - and is only used when the Redis servers are started via ray.init() - as opposed to ray start. + password (str): Prevents external clients without the password + from connecting to Redis if provided. executable (str): Full path tho the redis-server executable. modules (list of str): A list of pathnames, pointing to the redis module(s) that will be loaded in this redis server. If None, load the default Ray redis module. + redis_max_memory: The max amount of memory (in bytes) to allow redis + to use, or None for no limit. 
Once the limit is exceeded, redis + will start LRU eviction of entries. Returns: A tuple of the port used by Redis and a handle to the process that was @@ -637,9 +628,6 @@ def _start_redis_instance(node_ip_address="127.0.0.1", else: port = new_port() - if protected_mode: - redis_config_filename = _make_temp_redis_config(node_ip_address) - load_module_args = [] for module in modules: load_module_args += ["--loadmodule", module] @@ -650,8 +638,8 @@ def _start_redis_instance(node_ip_address="127.0.0.1", # Construct the command to start the Redis server. command = [executable] - if protected_mode: - command += [redis_config_filename] + if password: + command += ["--requirepass", password] command += ( ["--port", str(port), "--loglevel", "warning"] + load_module_args) @@ -670,17 +658,25 @@ def _start_redis_instance(node_ip_address="127.0.0.1", stdout_file.name, stderr_file.name)) # Create a Redis client just for configuring Redis. - redis_client = redis.StrictRedis(host="127.0.0.1", port=port) + redis_client = redis.StrictRedis( + host="127.0.0.1", port=port, password=password) # Wait for the Redis server to start. - wait_for_redis_to_start("127.0.0.1", port) + wait_for_redis_to_start("127.0.0.1", port, password=password) # Configure Redis to generate keyspace notifications. TODO(rkn): Change # this to only generate notifications for the export keys. redis_client.config_set("notify-keyspace-events", "Kl") # Configure Redis to not run in protected mode so that processes on other # hosts can connect to it. TODO(rkn): Do this in a more secure way. - if not protected_mode: - redis_client.config_set("protected-mode", "no") + redis_client.config_set("protected-mode", "no") + + # Discard old task and object metadata. + if redis_max_memory is not None: + redis_client.config_set("maxmemory", str(redis_max_memory)) + redis_client.config_set("maxmemory-policy", "allkeys-lru") + redis_client.config_set("maxmemory-samples", "10") + logger.info("Starting Redis shard with {} GB max memory.".format( + round(redis_max_memory / 1e9, 2))) # If redis_max_clients is provided, attempt to raise the number of maximum # number of Redis clients. @@ -717,8 +713,9 @@ def _start_redis_instance(node_ip_address="127.0.0.1", redis_client.set("redis_start_time", time.time()) # Record the log files in Redis. record_log_files_in_redis( - address(node_ip_address, port), node_ip_address, - [stdout_file, stderr_file]) + address(node_ip_address, port), + node_ip_address, [stdout_file, stderr_file], + password=password) return port, p @@ -726,7 +723,8 @@ def start_log_monitor(redis_address, node_ip_address, stdout_file=None, stderr_file=None, - cleanup=cleanup): + cleanup=cleanup, + redis_password=None): """Start a log monitor process. Args: @@ -740,50 +738,23 @@ def start_log_monitor(redis_address, cleanup (bool): True if using Ray in local mode. If cleanup is true, then this process will be killed by services.cleanup() when the Python process that imported services exits. + redis_password (str): The password of the redis server. 
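The `redis_max_memory` handling above boils down to three CONFIG SET calls on each sharded Redis instance. For reference, the equivalent applied by hand to a running shard (host, port, and the memory figure are placeholders):

    import redis

    redis_max_memory = 10 * 1000 * 1000 * 1000  # 10 GB, for illustration

    # Placeholder connection details for one of the sharded Redis instances.
    client = redis.StrictRedis(host="127.0.0.1", port=6380)
    client.config_set("maxmemory", str(redis_max_memory))
    client.config_set("maxmemory-policy", "allkeys-lru")
    client.config_set("maxmemory-samples", "10")
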
""" log_monitor_filepath = os.path.join( os.path.dirname(os.path.abspath(__file__)), "log_monitor.py") - p = subprocess.Popen( - [ - sys.executable, "-u", log_monitor_filepath, "--redis-address", - redis_address, "--node-ip-address", node_ip_address - ], - stdout=stdout_file, - stderr=stderr_file) + command = [ + sys.executable, "-u", log_monitor_filepath, "--redis-address", + redis_address, "--node-ip-address", node_ip_address + ] + if redis_password: + command += ["--redis-password", redis_password] + p = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) if cleanup: all_processes[PROCESS_TYPE_LOG_MONITOR].append(p) - record_log_files_in_redis(redis_address, node_ip_address, - [stdout_file, stderr_file]) - - -def start_global_scheduler(redis_address, - node_ip_address, - stdout_file=None, - stderr_file=None, - cleanup=True): - """Start a global scheduler process. - - Args: - redis_address (str): The address of the Redis instance. - node_ip_address: The IP address of the node that this scheduler will - run on. - stdout_file: A file handle opened for writing to redirect stdout to. If - no redirection should happen, then this should be None. - stderr_file: A file handle opened for writing to redirect stderr to. If - no redirection should happen, then this should be None. - cleanup (bool): True if using Ray in local mode. If cleanup is true, - then this process will be killed by services.cleanup() when the - Python process that imported services exits. - """ - p = global_scheduler.start_global_scheduler( + record_log_files_in_redis( redis_address, - node_ip_address, - stdout_file=stdout_file, - stderr_file=stderr_file) - if cleanup: - all_processes[PROCESS_TYPE_GLOBAL_SCHEDULER].append(p) - record_log_files_in_redis(redis_address, node_ip_address, - [stdout_file, stderr_file]) + node_ip_address, [stdout_file, stderr_file], + password=redis_password) def start_ui(redis_address, stdout_file=None, stderr_file=None, cleanup=True): @@ -799,15 +770,7 @@ def start_ui(redis_address, stdout_file=None, stderr_file=None, cleanup=True): then this process will be killed by services.cleanup() when the Python process that imported services exits. """ - new_env = os.environ.copy() - notebook_filepath = os.path.join( - os.path.dirname(os.path.abspath(__file__)), "WebUI.ipynb") - # We copy the notebook file so that the original doesn't get modified by - # the user. - random_ui_id = random.randint(0, 100000) - new_notebook_filepath = "/tmp/raylogs/ray_ui{}.ipynb".format(random_ui_id) - new_notebook_directory = os.path.dirname(new_notebook_filepath) - shutil.copy(notebook_filepath, new_notebook_filepath) + port = 8888 while True: try: @@ -821,7 +784,8 @@ def start_ui(redis_address, stdout_file=None, stderr_file=None, cleanup=True): new_env["REDIS_ADDRESS"] = redis_address # We generate the token used for authentication ourselves to avoid # querying the jupyter server. - token = ray.utils.decode(binascii.hexlify(os.urandom(24))) + new_notebook_directory, webui_url, token = ( + get_ipython_notebook_path(port)) # The --ip=0.0.0.0 flag is intended to enable connecting to a notebook # running within a docker container (from the outside). 
command = [ @@ -847,21 +811,17 @@ def start_ui(redis_address, stdout_file=None, stderr_file=None, cleanup=True): else: if cleanup: all_processes[PROCESS_TYPE_WEB_UI].append(ui_process) - webui_url = ("http://localhost:{}/notebooks/ray_ui{}.ipynb?token={}" - .format(port, random_ui_id, token)) logger.info("\n" + "=" * 70) logger.info("View the web UI at {}".format(webui_url)) logger.info("=" * 70 + "\n") return webui_url -def check_and_update_resources(resources, use_raylet): +def check_and_update_resources(resources): """Sanity check a resource dictionary and add sensible defaults. Args: resources: A dictionary mapping resource names to resource quantities. - use_raylet: True if we are using the raylet code path and false - otherwise. Returns: A new resource dictionary. @@ -900,86 +860,30 @@ def check_and_update_resources(resources, use_raylet): and not resource_quantity.is_integer()): raise ValueError("Resource quantities must all be whole numbers.") - if (use_raylet and - resource_quantity > ray.ray_constants.MAX_RESOURCE_QUANTITY): + if resource_quantity > ray.ray_constants.MAX_RESOURCE_QUANTITY: raise ValueError("Resource quantities must be at most {}.".format( ray.ray_constants.MAX_RESOURCE_QUANTITY)) return resources -def start_local_scheduler(redis_address, - node_ip_address, - plasma_store_name, - plasma_manager_name, - worker_path, - plasma_address=None, - stdout_file=None, - stderr_file=None, - cleanup=True, - resources=None, - num_workers=0): - """Start a local scheduler process. - - Args: - redis_address (str): The address of the Redis instance. - node_ip_address (str): The IP address of the node that this local - scheduler is running on. - plasma_store_name (str): The name of the plasma store socket to connect - to. - plasma_manager_name (str): The name of the plasma manager socket to - connect to. - worker_path (str): The path of the script to use when the local - scheduler starts up new workers. - stdout_file: A file handle opened for writing to redirect stdout to. If - no redirection should happen, then this should be None. - stderr_file: A file handle opened for writing to redirect stderr to. If - no redirection should happen, then this should be None. - cleanup (bool): True if using Ray in local mode. If cleanup is true, - then this process will be killed by serices.cleanup() when the - Python process that imported services exits. - resources: A dictionary mapping the name of a resource to the available - quantity of that resource. - num_workers (int): The number of workers that the local scheduler - should start. - - Return: - The name of the local scheduler socket. - """ - resources = check_and_update_resources(resources, False) - - logger.info("Starting local scheduler with the following resources: {}." 
- .format(resources)) - local_scheduler_name, p = ray.local_scheduler.start_local_scheduler( - plasma_store_name, - plasma_manager_name, - worker_path=worker_path, - node_ip_address=node_ip_address, - redis_address=redis_address, - plasma_address=plasma_address, - use_profiler=RUN_LOCAL_SCHEDULER_PROFILER, - stdout_file=stdout_file, - stderr_file=stderr_file, - static_resources=resources, - num_workers=num_workers) - if cleanup: - all_processes[PROCESS_TYPE_LOCAL_SCHEDULER].append(p) - record_log_files_in_redis(redis_address, node_ip_address, - [stdout_file, stderr_file]) - return local_scheduler_name - - def start_raylet(redis_address, node_ip_address, + raylet_name, plasma_store_name, worker_path, resources=None, + object_manager_port=None, + node_manager_port=None, num_workers=0, use_valgrind=False, use_profiler=False, stdout_file=None, stderr_file=None, - cleanup=True): + cleanup=True, + config=None, + redis_password=None, + collect_profiling_data=True): """Start a raylet, which is a combined local scheduler and object manager. Args: @@ -988,8 +892,16 @@ def start_raylet(redis_address, scheduler is running on. plasma_store_name (str): The name of the plasma store socket to connect to. + raylet_name (str): The name of the raylet socket to create. worker_path (str): The path of the script to use when the local scheduler starts up new workers. + resources: The resources that this raylet has. + object_manager_port (int): The port to use for the object manager. If + this is not provided, we will use 0 and the object manager will + choose its own port. + node_manager_port (int): The port to use for the node manager. If + this is not provided, we will use 0 and the node manager will + choose its own port. use_valgrind (bool): True if the raylet should be started inside of valgrind. If this is True, use_profiler must be False. use_profiler (bool): True if the raylet should be started inside @@ -1001,14 +913,21 @@ def start_raylet(redis_address, cleanup (bool): True if using Ray in local mode. If cleanup is true, then this process will be killed by serices.cleanup() when the Python process that imported services exits. + config (dict|None): Optional Raylet configuration that will + override defaults in RayConfig. + redis_password (str): The password of the redis server. + collect_profiling_data: Whether to collect profiling data from workers. Returns: The raylet socket name. """ + config = config or {} + config_str = ",".join(["{},{}".format(*kv) for kv in config.items()]) + if use_valgrind and use_profiler: raise Exception("Cannot use valgrind and profiler at the same time.") - static_resources = check_and_update_resources(resources, True) + static_resources = check_and_update_resources(resources) # Limit the number of workers that can be started in parallel by the # raylet. However, make sure it is at least 1. @@ -1016,36 +935,52 @@ def start_raylet(redis_address, 1, min(multiprocessing.cpu_count(), static_resources["CPU"])) # Format the resource argument in a form like 'CPU,1.0,GPU,0,Custom,3'. - resource_argument = ",".join([ - "{},{}".format(resource_name, resource_value) - for resource_name, resource_value in zip(static_resources.keys(), - static_resources.values()) - ]) + resource_argument = ",".join( + ["{},{}".format(*kv) for kv in static_resources.items()]) gcs_ip_address, gcs_port = redis_address.split(":") - raylet_name = "/tmp/raylet{}".format(random_name()) # Create the command that the Raylet will use to start workers. 
start_worker_command = ("{} {} " "--node-ip-address={} " "--object-store-name={} " "--raylet-name={} " - "--redis-address={}".format( + "--redis-address={} " + "--collect-profiling-data={} " + "--temp-dir={}".format( sys.executable, worker_path, node_ip_address, - plasma_store_name, raylet_name, redis_address)) + plasma_store_name, raylet_name, redis_address, + "1" if collect_profiling_data else "0", + get_temp_root())) + if redis_password: + start_worker_command += " --redis-password {}".format(redis_password) + + # If the object manager port is None, then use 0 to cause the object + # manager to choose its own port. + if object_manager_port is None: + object_manager_port = 0 + # If the node manager port is None, then use 0 to cause the node manager + # to choose its own port. + if node_manager_port is None: + node_manager_port = 0 command = [ RAYLET_EXECUTABLE, raylet_name, plasma_store_name, + str(object_manager_port), + str(node_manager_port), node_ip_address, gcs_ip_address, gcs_port, str(num_workers), str(maximum_startup_concurrency), resource_argument, + config_str, start_worker_command, "", # Worker command for Java, not needed for Python. + redis_password or "", + get_temp_root(), ] if use_valgrind: @@ -1062,29 +997,114 @@ def start_raylet(redis_address, ["valgrind", "--tool=callgrind"] + command, stdout=stdout_file, stderr=stderr_file) + elif "RAYLET_PERFTOOLS_PATH" in os.environ: + modified_env = os.environ.copy() + modified_env["LD_PRELOAD"] = os.environ["RAYLET_PERFTOOLS_PATH"] + modified_env["CPUPROFILE"] = os.environ["RAYLET_PERFTOOLS_LOGFILE"] + pid = subprocess.Popen( + command, stdout=stdout_file, stderr=stderr_file, env=modified_env) else: pid = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) if cleanup: all_processes[PROCESS_TYPE_RAYLET].append(pid) - record_log_files_in_redis(redis_address, node_ip_address, - [stdout_file, stderr_file]) + record_log_files_in_redis( + redis_address, + node_ip_address, [stdout_file, stderr_file], + password=redis_password) return raylet_name +def determine_plasma_store_config(object_store_memory=None, + plasma_directory=None, + huge_pages=False): + """Figure out how to configure the plasma object store. + + This will determine which directory to use for the plasma store (e.g., + /tmp or /dev/shm) and how much memory to start the store with. On Linux, + we will try to use /dev/shm unless the shared memory file system is too + small, in which case we will fall back to /tmp. If any of the object store + memory or plasma directory parameters are specified by the user, then those + values will be preserved. + + Args: + object_store_memory (int): The user-specified object store memory + parameter. + plasma_directory (str): The user-specified plasma directory parameter. + huge_pages (bool): The user-specified huge pages parameter. + + Returns: + A tuple of the object store memory to use and the plasma directory to + use. If either of these values is specified by the user, then that + value will be preserved. + """ + system_memory = ray.utils.get_system_memory() + + # Choose a default object store size. + if object_store_memory is None: + object_store_memory = int(system_memory * 0.4) + # Cap memory to avoid memory waste and perf issues on large nodes + if object_store_memory > MAX_DEFAULT_MEM: + logger.warning( + "Warning: Capping object memory store to {}GB. 
".format( + MAX_DEFAULT_MEM // 1e9) + + "To increase this further, specify `object_store_memory` " + "when calling ray.init() or ray start.") + object_store_memory = MAX_DEFAULT_MEM + + # Determine which directory to use. By default, use /tmp on MacOS and + # /dev/shm on Linux, unless the shared-memory file system is too small, + # in which case we default to /tmp on Linux. + if plasma_directory is None: + if sys.platform == "linux" or sys.platform == "linux2": + shm_avail = ray.utils.get_shared_memory_bytes() + # Compare the requested memory size to the memory available in + # /dev/shm. + if shm_avail > object_store_memory: + plasma_directory = "/dev/shm" + else: + plasma_directory = "/tmp" + logger.warning( + "WARNING: The object store is using /tmp instead of " + "/dev/shm because /dev/shm has only {} bytes available. " + "This may slow down performance! You may be able to free " + "up space by deleting files in /dev/shm or terminating " + "any running plasma_store_server processes. If you are " + "inside a Docker container, you may need to pass an " + "argument with the flag '--shm-size' to 'docker run'." + .format(shm_avail)) + else: + plasma_directory = "/tmp" + + # Do some sanity checks. + if object_store_memory > system_memory: + raise Exception( + "The requested object store memory size is greater " + "than the total available memory.") + else: + plasma_directory = os.path.abspath(plasma_directory) + logger.warning("WARNING: object_store_memory is not verified when " + "plasma_directory is set.") + + if not os.path.isdir(plasma_directory): + raise Exception("The file {} does not exist or is not a directory." + .format(plasma_directory)) + + return object_store_memory, plasma_directory + + def start_plasma_store(node_ip_address, redis_address, object_manager_port=None, store_stdout_file=None, store_stderr_file=None, - manager_stdout_file=None, - manager_stderr_file=None, - objstore_memory=None, + object_store_memory=None, cleanup=True, plasma_directory=None, huge_pages=False, - use_raylet=False): + plasma_store_socket_name=None, + redis_password=None): """This method starts an object store process. Args: @@ -1097,14 +1117,8 @@ def start_plasma_store(node_ip_address, to. If no redirection should happen, then this should be None. store_stderr_file: A file handle opened for writing to redirect stderr to. If no redirection should happen, then this should be None. - manager_stdout_file: A file handle opened for writing to redirect - stdout to. If no redirection should happen, then this should be - None. - manager_stderr_file: A file handle opened for writing to redirect - stderr to. If no redirection should happen, then this should be - None. - objstore_memory: The amount of memory (in bytes) to start the object - store with. + object_store_memory: The amount of memory (in bytes) to start the + object store with. cleanup (bool): True if using Ray in local mode. If cleanup is true, then this process will be killed by serices.cleanup() when the Python process that imported services exits. @@ -1112,97 +1126,40 @@ def start_plasma_store(node_ip_address, be created. huge_pages: Boolean flag indicating whether to start the Object Store with hugetlbfs support. Requires plasma_directory. - use_raylet: True if the new raylet code path should be used. This is - not supported yet. + redis_password (str): The password of the redis server. Return: - A tuple of the Plasma store socket name, the Plasma manager socket - name, and the plasma manager port. + The Plasma store socket name. 
""" - if objstore_memory is None: - # Compute a fraction of the system memory for the Plasma store to use. - system_memory = ray.utils.get_system_memory() - if sys.platform == "linux" or sys.platform == "linux2": - # On linux we use /dev/shm, its size is half the size of the - # physical memory. To not overflow it, we set the plasma memory - # limit to 0.4 times the size of the physical memory. - objstore_memory = int(system_memory * 0.4) - # Compare the requested memory size to the memory available in - # /dev/shm. - shm_fd = os.open("/dev/shm", os.O_RDONLY) - try: - shm_fs_stats = os.fstatvfs(shm_fd) - # The value shm_fs_stats.f_bsize is the block size and the - # value shm_fs_stats.f_bavail is the number of available - # blocks. - shm_avail = shm_fs_stats.f_bsize * shm_fs_stats.f_bavail - if objstore_memory > shm_avail: - logger.warning( - "Warning: Reducing object store memory because " - "/dev/shm has only {} bytes available. You may be " - "able to free up space by deleting files in " - "/dev/shm. If you are inside a Docker container, " - "you may need to pass an argument with the flag " - "'--shm-size' to 'docker run'.".format(shm_avail)) - objstore_memory = int(shm_avail * 0.8) - finally: - os.close(shm_fd) - else: - objstore_memory = int(system_memory * 0.8) + object_store_memory, plasma_directory = determine_plasma_store_config( + object_store_memory, plasma_directory, huge_pages) + + # Print the object store memory using two decimal places. + object_store_memory_str = (object_store_memory / 10**7) / 10**2 + logger.info("Starting the Plasma object store with {} GB memory " + "using {}.".format(object_store_memory_str, plasma_directory)) # Start the Plasma store. - logger.info("Starting the Plasma object store with {0:.2f} GB memory." - .format(objstore_memory // 10**9)) plasma_store_name, p1 = ray.plasma.start_plasma_store( - plasma_store_memory=objstore_memory, + plasma_store_memory=object_store_memory, use_profiler=RUN_PLASMA_STORE_PROFILER, stdout_file=store_stdout_file, stderr_file=store_stderr_file, plasma_directory=plasma_directory, - huge_pages=huge_pages) - # Start the plasma manager. 
- if not use_raylet: - if object_manager_port is not None: - (plasma_manager_name, p2, - plasma_manager_port) = ray.plasma.start_plasma_manager( - plasma_store_name, - redis_address, - plasma_manager_port=object_manager_port, - node_ip_address=node_ip_address, - num_retries=1, - run_profiler=RUN_PLASMA_MANAGER_PROFILER, - stdout_file=manager_stdout_file, - stderr_file=manager_stderr_file) - assert plasma_manager_port == object_manager_port - else: - (plasma_manager_name, p2, - plasma_manager_port) = ray.plasma.start_plasma_manager( - plasma_store_name, - redis_address, - node_ip_address=node_ip_address, - run_profiler=RUN_PLASMA_MANAGER_PROFILER, - stdout_file=manager_stdout_file, - stderr_file=manager_stderr_file) - else: - plasma_manager_port = None - plasma_manager_name = None + huge_pages=huge_pages, + socket_name=plasma_store_socket_name) if cleanup: all_processes[PROCESS_TYPE_PLASMA_STORE].append(p1) - record_log_files_in_redis(redis_address, node_ip_address, - [store_stdout_file, store_stderr_file]) - if not use_raylet: - if cleanup: - all_processes[PROCESS_TYPE_PLASMA_MANAGER].append(p2) - record_log_files_in_redis(redis_address, node_ip_address, - [manager_stdout_file, manager_stderr_file]) + record_log_files_in_redis( + redis_address, + node_ip_address, [store_stdout_file, store_stderr_file], + password=redis_password) - return ObjectStoreAddress(plasma_store_name, plasma_manager_name, - plasma_manager_port) + return plasma_store_name def start_worker(node_ip_address, object_store_name, - object_store_manager_name, local_scheduler_name, redis_address, worker_path, @@ -1215,7 +1172,6 @@ def start_worker(node_ip_address, node_ip_address (str): The IP address of the node that this worker is running on. object_store_name (str): The name of the object store. - object_store_manager_name (str): The name of the object store manager. local_scheduler_name (str): The name of the local scheduler. redis_address (str): The address that the Redis server is listening on. worker_path (str): The path of the source code which the worker process @@ -1233,9 +1189,8 @@ def start_worker(node_ip_address, sys.executable, "-u", worker_path, "--node-ip-address=" + node_ip_address, "--object-store-name=" + object_store_name, - "--object-store-manager-name=" + object_store_manager_name, - "--local-scheduler-name=" + local_scheduler_name, - "--redis-address=" + str(redis_address) + "--redis-address=" + str(redis_address), + "--temp-dir=" + get_temp_root() ] p = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) if cleanup: @@ -1249,7 +1204,8 @@ def start_monitor(redis_address, stdout_file=None, stderr_file=None, cleanup=True, - autoscaling_config=None): + autoscaling_config=None, + redis_password=None): """Run a process to monitor the other processes. Args: @@ -1265,6 +1221,7 @@ def start_monitor(redis_address, Python process that imported services exits. This is True by default. autoscaling_config: path to autoscaling config file. + redis_password (str): The password of the redis server. 
""" monitor_path = os.path.join( os.path.dirname(os.path.abspath(__file__)), "monitor.py") @@ -1274,17 +1231,23 @@ def start_monitor(redis_address, ] if autoscaling_config: command.append("--autoscaling-config=" + str(autoscaling_config)) + if redis_password: + command.append("--redis-password=" + redis_password) p = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) if cleanup: all_processes[PROCESS_TYPE_MONITOR].append(p) - record_log_files_in_redis(redis_address, node_ip_address, - [stdout_file, stderr_file]) + record_log_files_in_redis( + redis_address, + node_ip_address, [stdout_file, stderr_file], + password=redis_password) def start_raylet_monitor(redis_address, stdout_file=None, stderr_file=None, - cleanup=True): + cleanup=True, + redis_password=None, + config=None): """Run a process to monitor the other processes. Args: @@ -1297,29 +1260,40 @@ def start_raylet_monitor(redis_address, then this process will be killed by services.cleanup() when the Python process that imported services exits. This is True by default. + redis_password (str): The password of the redis server. + config (dict|None): Optional configuration that will + override defaults in RayConfig. """ gcs_ip_address, gcs_port = redis_address.split(":") - command = [RAYLET_MONITOR_EXECUTABLE, gcs_ip_address, gcs_port] + redis_password = redis_password or "" + config = config or {} + config_str = ",".join(["{},{}".format(*kv) for kv in config.items()]) + command = [RAYLET_MONITOR_EXECUTABLE, gcs_ip_address, gcs_port, config_str] + if redis_password: + command += [redis_password] p = subprocess.Popen(command, stdout=stdout_file, stderr=stderr_file) if cleanup: all_processes[PROCESS_TYPE_MONITOR].append(p) def start_ray_processes(address_info=None, + object_manager_ports=None, + node_manager_ports=None, node_ip_address="127.0.0.1", redis_port=None, redis_shard_ports=None, num_workers=None, num_local_schedulers=1, object_store_memory=None, + redis_max_memory=None, + collect_profiling_data=True, num_redis_shards=1, redis_max_clients=None, - redis_protected_mode=False, + redis_password=None, worker_path=None, cleanup=True, redirect_worker_output=False, redirect_output=False, - include_global_scheduler=False, include_log_monitor=False, include_webui=False, start_workers_from_local_scheduler=True, @@ -1327,13 +1301,22 @@ def start_ray_processes(address_info=None, plasma_directory=None, huge_pages=False, autoscaling_config=None, - use_raylet=False): + plasma_store_socket_name=None, + raylet_socket_name=None, + temp_dir=None, + _internal_config=None): """Helper method to start Ray processes. Args: address_info (dict): A dictionary with address information for processes that have already been started. If provided, address_info will be modified to include processes that are newly started. + object_manager_ports (list): A list of the ports to use for the object + managers. There should be one per object manager being started on + this node (typically just one). + node_manager_ports (list): A list of the ports to use for the node + managers. There should be one per node manager being started on + this node (typically just one). node_ip_address (str): The IP address of this node. redis_port (int): The port that the primary Redis shard should listen to. If None, then a random port will be chosen. If the key @@ -1350,13 +1333,20 @@ def start_ray_processes(address_info=None, address_info. object_store_memory: The amount of memory (in bytes) to start the object store with. 
+ redis_max_memory: The max amount of memory (in bytes) to allow redis + to use, or None for no limit. Once the limit is exceeded, redis + will start LRU eviction of entries. This only applies to the + sharded redis tables (task and object tables). + collect_profiling_data: Whether to collect profiling data. Note that + profiling data cannot be LRU evicted, so if you set + redis_max_memory then profiling will also be disabled to prevent + it from consuming all available redis memory. num_redis_shards: The number of Redis shards to start in addition to the primary Redis shard. redis_max_clients: If provided, attempt to configure Redis with this maxclients number. - redis_protected_mode: True if we should start Redis in protected mode. - This will prevent clients from other machines from connecting and - is only done when Redis is started via ray.init(). + redis_password (str): Prevents external clients without the password + from connecting to Redis if provided. worker_path (str): The path of the source code that will be run by the worker. cleanup (bool): If cleanup is true, then the processes started here @@ -1366,8 +1356,6 @@ def start_ray_processes(address_info=None, processes should be redirected to files. redirect_output (bool): True if stdout and stderr for non-worker processes should be redirected to files and false otherwise. - include_global_scheduler (bool): If include_global_scheduler is True, - then start a global scheduler process. include_log_monitor (bool): If True, then start a log monitor to monitor the log files for all processes on this node and push their contents to Redis. @@ -1383,15 +1371,26 @@ def start_ray_processes(address_info=None, huge_pages: Boolean flag indicating whether to start the Object Store with hugetlbfs support. Requires plasma_directory. autoscaling_config: path to autoscaling config file. - use_raylet: True if the new raylet code path should be used. This is - not supported yet. + plasma_store_socket_name (str): If provided, it will specify the socket + name used by the plasma store. + raylet_socket_name (str): If provided, it will specify the socket path + used by the raylet process. + temp_dir (str): If provided, it will specify the root temporary + directory for the Ray process. + _internal_config (str): JSON configuration for overriding + RayConfig defaults. For testing purposes ONLY. Returns: A dictionary of the address information for the processes that were started. """ - logger.info( - "Process STDOUT and STDERR is being redirected to /tmp/raylogs/.") + + set_temp_root(temp_dir) + + logger.info("Process STDOUT and STDERR is being redirected to {}.".format( + get_logs_dir_path())) + + config = json.loads(_internal_config) if _internal_config else None if resources is None: resources = {} @@ -1399,7 +1398,8 @@ def start_ray_processes(address_info=None, resources = num_local_schedulers * [resources] if num_workers is not None: - workers_per_local_scheduler = num_local_schedulers * [num_workers] + raise Exception("The 'num_workers' argument is deprecated. 
Please use " + "'num_cpus' instead.") else: workers_per_local_scheduler = [] for resource_dict in resources: @@ -1429,190 +1429,116 @@ def start_ray_processes(address_info=None, redis_shard_ports=redis_shard_ports, num_redis_shards=num_redis_shards, redis_max_clients=redis_max_clients, - use_raylet=use_raylet, redirect_output=True, redirect_worker_output=redirect_worker_output, cleanup=cleanup, - protected_mode=redis_protected_mode) + password=redis_password, + redis_max_memory=redis_max_memory) address_info["redis_address"] = redis_address time.sleep(0.1) # Start monitoring the processes. - monitor_stdout_file, monitor_stderr_file = new_log_files( - "monitor", redirect_output) + monitor_stdout_file, monitor_stderr_file = new_monitor_log_file( + redirect_output) start_monitor( redis_address, node_ip_address, stdout_file=monitor_stdout_file, stderr_file=monitor_stderr_file, cleanup=cleanup, - autoscaling_config=autoscaling_config) - if use_raylet: - start_raylet_monitor( - redis_address, - stdout_file=monitor_stdout_file, - stderr_file=monitor_stderr_file, - cleanup=cleanup) + autoscaling_config=autoscaling_config, + redis_password=redis_password) + start_raylet_monitor( + redis_address, + stdout_file=monitor_stdout_file, + stderr_file=monitor_stderr_file, + cleanup=cleanup, + redis_password=redis_password, + config=config) if redis_shards == []: # Get redis shards from primary redis instance. redis_ip_address, redis_port = redis_address.split(":") redis_client = redis.StrictRedis( - host=redis_ip_address, port=redis_port) + host=redis_ip_address, port=redis_port, password=redis_password) redis_shards = redis_client.lrange("RedisShards", start=0, end=-1) redis_shards = [ray.utils.decode(shard) for shard in redis_shards] address_info["redis_shards"] = redis_shards # Start the log monitor, if necessary. if include_log_monitor: - log_monitor_stdout_file, log_monitor_stderr_file = new_log_files( - "log_monitor", redirect_output=True) + log_monitor_stdout_file, log_monitor_stderr_file = ( + new_log_monitor_log_file()) start_log_monitor( redis_address, node_ip_address, stdout_file=log_monitor_stdout_file, stderr_file=log_monitor_stderr_file, - cleanup=cleanup) - - # Start the global scheduler, if necessary. - if include_global_scheduler and not use_raylet: - global_scheduler_stdout_file, global_scheduler_stderr_file = ( - new_log_files("global_scheduler", redirect_output)) - start_global_scheduler( - redis_address, - node_ip_address, - stdout_file=global_scheduler_stdout_file, - stderr_file=global_scheduler_stderr_file, - cleanup=cleanup) + cleanup=cleanup, + redis_password=redis_password) # Initialize with existing services. if "object_store_addresses" not in address_info: address_info["object_store_addresses"] = [] object_store_addresses = address_info["object_store_addresses"] - if "local_scheduler_socket_names" not in address_info: - address_info["local_scheduler_socket_names"] = [] - local_scheduler_socket_names = address_info["local_scheduler_socket_names"] if "raylet_socket_names" not in address_info: address_info["raylet_socket_names"] = [] raylet_socket_names = address_info["raylet_socket_names"] # Get the ports to use for the object managers if any are provided. 
- object_manager_ports = (address_info["object_manager_ports"] if - "object_manager_ports" in address_info else None) if not isinstance(object_manager_ports, list): + assert object_manager_ports is None or num_local_schedulers == 1 object_manager_ports = num_local_schedulers * [object_manager_ports] assert len(object_manager_ports) == num_local_schedulers + if not isinstance(node_manager_ports, list): + assert node_manager_ports is None or num_local_schedulers == 1 + node_manager_ports = num_local_schedulers * [node_manager_ports] + assert len(node_manager_ports) == num_local_schedulers # Start any object stores that do not yet exist. for i in range(num_local_schedulers - len(object_store_addresses)): # Start Plasma. - plasma_store_stdout_file, plasma_store_stderr_file = new_log_files( - "plasma_store_{}".format(i), redirect_output) - plasma_manager_stdout_file, plasma_manager_stderr_file = new_log_files( - "plasma_manager_{}".format(i), redirect_output) + plasma_store_stdout_file, plasma_store_stderr_file = ( + new_plasma_store_log_file(i, redirect_output)) + object_store_address = start_plasma_store( node_ip_address, redis_address, - object_manager_port=object_manager_ports[i], store_stdout_file=plasma_store_stdout_file, store_stderr_file=plasma_store_stderr_file, - manager_stdout_file=plasma_manager_stdout_file, - manager_stderr_file=plasma_manager_stderr_file, - objstore_memory=object_store_memory, + object_store_memory=object_store_memory, cleanup=cleanup, plasma_directory=plasma_directory, huge_pages=huge_pages, - use_raylet=use_raylet) + plasma_store_socket_name=plasma_store_socket_name, + redis_password=redis_password) object_store_addresses.append(object_store_address) time.sleep(0.1) - if not use_raylet: - # Start any local schedulers that do not yet exist. - for i in range( - len(local_scheduler_socket_names), num_local_schedulers): - # Connect the local scheduler to the object store at the same - # index. - object_store_address = object_store_addresses[i] - plasma_address = "{}:{}".format(node_ip_address, - object_store_address.manager_port) - # Determine how many workers this local scheduler should start. - if start_workers_from_local_scheduler: - num_local_scheduler_workers = workers_per_local_scheduler[i] - workers_per_local_scheduler[i] = 0 - else: - # If we're starting the workers from Python, the local - # scheduler should not start any workers. - num_local_scheduler_workers = 0 - # Start the local scheduler. Note that if we do not wish to - # redirect the worker output, then we cannot redirect the local - # scheduler output. - local_scheduler_stdout_file, local_scheduler_stderr_file = ( - new_log_files( - "local_scheduler_{}".format(i), - redirect_output=redirect_worker_output)) - local_scheduler_name = start_local_scheduler( + # Start any raylets that do not exist yet. 
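The port handling above accepts either a per-scheduler list or a single value (or None); a scalar is only legal when one local scheduler is started and is broadcast into a list so the raylet loop below can index it positionally. A minimal sketch of that normalization (the helper name is illustrative):

    def normalize_ports(ports, num_local_schedulers):
        # A scalar (or None) is only meaningful for a single local scheduler;
        # broadcast it so callers can always index by scheduler number.
        if not isinstance(ports, list):
            assert ports is None or num_local_schedulers == 1
            ports = num_local_schedulers * [ports]
        assert len(ports) == num_local_schedulers
        return ports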
+ for i in range(len(raylet_socket_names), num_local_schedulers): + raylet_stdout_file, raylet_stderr_file = new_raylet_log_file( + i, redirect_output=redirect_worker_output) + address_info["raylet_socket_names"].append( + start_raylet( redis_address, node_ip_address, - object_store_address.name, - object_store_address.manager_name, + raylet_socket_name or get_raylet_socket_name(), + object_store_addresses[i], worker_path, - plasma_address=plasma_address, - stdout_file=local_scheduler_stdout_file, - stderr_file=local_scheduler_stderr_file, - cleanup=cleanup, + object_manager_port=object_manager_ports[i], + node_manager_port=node_manager_ports[i], resources=resources[i], - num_workers=num_local_scheduler_workers) - local_scheduler_socket_names.append(local_scheduler_name) - - # Make sure that we have exactly num_local_schedulers instances of - # object stores and local schedulers. - assert len(object_store_addresses) == num_local_schedulers - assert len(local_scheduler_socket_names) == num_local_schedulers - - else: - # Start any raylets that do not exist yet. - for i in range(len(raylet_socket_names), num_local_schedulers): - raylet_stdout_file, raylet_stderr_file = new_log_files( - "raylet_{}".format(i), redirect_output=redirect_worker_output) - address_info["raylet_socket_names"].append( - start_raylet( - redis_address, - node_ip_address, - object_store_addresses[i].name, - worker_path, - resources=resources[i], - num_workers=workers_per_local_scheduler[i], - stdout_file=raylet_stdout_file, - stderr_file=raylet_stderr_file, - cleanup=cleanup)) - - if not use_raylet: - # Start any workers that the local scheduler has not already started. - for i, num_local_scheduler_workers in enumerate( - workers_per_local_scheduler): - object_store_address = object_store_addresses[i] - local_scheduler_name = local_scheduler_socket_names[i] - for j in range(num_local_scheduler_workers): - worker_stdout_file, worker_stderr_file = new_log_files( - "worker_{}_{}".format(i, j), redirect_output) - start_worker( - node_ip_address, - object_store_address.name, - object_store_address.manager_name, - local_scheduler_name, - redis_address, - worker_path, - stdout_file=worker_stdout_file, - stderr_file=worker_stderr_file, - cleanup=cleanup) - workers_per_local_scheduler[i] -= 1 - - # Make sure that we've started all the workers. - assert (sum(workers_per_local_scheduler) == 0) + num_workers=workers_per_local_scheduler[i], + stdout_file=raylet_stdout_file, + stderr_file=raylet_stderr_file, + cleanup=cleanup, + redis_password=redis_password, + collect_profiling_data=collect_profiling_data, + config=config)) # Try to start the web UI. if include_webui: - ui_stdout_file, ui_stderr_file = new_log_files( - "webui", redirect_output=True) + ui_stdout_file, ui_stderr_file = new_webui_log_file() address_info["webui_url"] = start_ui( redis_address, stdout_file=ui_stdout_file, @@ -1627,9 +1553,11 @@ def start_ray_processes(address_info=None, def start_ray_node(node_ip_address, redis_address, object_manager_ports=None, - num_workers=0, + node_manager_ports=None, + num_workers=None, num_local_schedulers=1, object_store_memory=None, + redis_password=None, worker_path=None, cleanup=True, redirect_worker_output=False, @@ -1637,7 +1565,10 @@ def start_ray_node(node_ip_address, resources=None, plasma_directory=None, huge_pages=False, - use_raylet=False): + plasma_store_socket_name=None, + raylet_socket_name=None, + temp_dir=None, + _internal_config=None): """Start the Ray processes for a single node. 
This assumes that the Ray processes on some master node have already been @@ -1649,12 +1580,17 @@ def start_ray_node(node_ip_address, object_manager_ports (list): A list of the ports to use for the object managers. There should be one per object manager being started on this node (typically just one). + node_manager_ports (list): A list of the ports to use for the node + managers. There should be one per node manager being started on + this node (typically just one). num_workers (int): The number of workers to start. num_local_schedulers (int): The number of local schedulers to start. This is also the number of plasma stores and plasma managers to start. object_store_memory (int): The maximum amount of memory (in bytes) to let the plasma store use. + redis_password (str): Prevents external clients without the password + from connecting to Redis if provided. worker_path (str): The path of the source code that will be run by the worker. cleanup (bool): If cleanup is true, then the processes started here @@ -1670,8 +1606,14 @@ def start_ray_node(node_ip_address, be created. huge_pages: Boolean flag indicating whether to start the Object Store with hugetlbfs support. Requires plasma_directory. - use_raylet: True if the new raylet code path should be used. This is - not supported yet. + plasma_store_socket_name (str): If provided, it will specify the socket + name used by the plasma store. + raylet_socket_name (str): If provided, it will specify the socket path + used by the raylet process. + temp_dir (str): If provided, it will specify the root temporary + directory for the Ray process. + _internal_config (str): JSON configuration for overriding + RayConfig defaults. For testing purposes ONLY. Returns: A dictionary of the address information for the processes that were @@ -1679,14 +1621,16 @@ def start_ray_node(node_ip_address, """ address_info = { "redis_address": redis_address, - "object_manager_ports": object_manager_ports } return start_ray_processes( address_info=address_info, + object_manager_ports=object_manager_ports, + node_manager_ports=node_manager_ports, node_ip_address=node_ip_address, num_workers=num_workers, num_local_schedulers=num_local_schedulers, object_store_memory=object_store_memory, + redis_password=redis_password, worker_path=worker_path, include_log_monitor=True, cleanup=cleanup, @@ -1695,16 +1639,23 @@ def start_ray_node(node_ip_address, resources=resources, plasma_directory=plasma_directory, huge_pages=huge_pages, - use_raylet=use_raylet) + plasma_store_socket_name=plasma_store_socket_name, + raylet_socket_name=raylet_socket_name, + temp_dir=temp_dir, + _internal_config=_internal_config) def start_ray_head(address_info=None, + object_manager_ports=None, + node_manager_ports=None, node_ip_address="127.0.0.1", redis_port=None, redis_shard_ports=None, - num_workers=0, + num_workers=None, num_local_schedulers=1, object_store_memory=None, + redis_max_memory=None, + collect_profiling_data=True, worker_path=None, cleanup=True, redirect_worker_output=False, @@ -1713,18 +1664,27 @@ def start_ray_head(address_info=None, resources=None, num_redis_shards=None, redis_max_clients=None, - redis_protected_mode=False, + redis_password=None, include_webui=True, plasma_directory=None, huge_pages=False, autoscaling_config=None, - use_raylet=False): + plasma_store_socket_name=None, + raylet_socket_name=None, + temp_dir=None, + _internal_config=None): """Start Ray in local mode. Args: address_info (dict): A dictionary with address information for processes that have already been started. 
If provided, address_info will be modified to include processes that are newly started. + object_manager_ports (list): A list of the ports to use for the object + managers. There should be one per object manager being started on + this node (typically just one). + node_manager_ports (list): A list of the ports to use for the node + managers. There should be one per node manager being started on + this node (typically just one). node_ip_address (str): The IP address of this node. redis_port (int): The port that the primary Redis shard should listen to. If None, then a random port will be chosen. If the key @@ -1741,6 +1701,11 @@ def start_ray_head(address_info=None, address_info. object_store_memory: The amount of memory (in bytes) to start the object store with. + redis_max_memory: The max amount of memory (in bytes) to allow redis + to use, or None for no limit. Once the limit is exceeded, redis + will start LRU eviction of entries. This only applies to the + sharded redis tables (task and object tables). + collect_profiling_data: Whether to collect profiling data from workers. worker_path (str): The path of the source code that will be run by the worker. cleanup (bool): If cleanup is true, then the processes started here @@ -1759,17 +1724,22 @@ def start_ray_head(address_info=None, the primary Redis shard. redis_max_clients: If provided, attempt to configure Redis with this maxclients number. - redis_protected_mode: True if we should start Redis in protected mode. - This will prevent clients from other machines from connecting and - is only done when Redis is started via ray.init(). + redis_password (str): Prevents external clients without the password + from connecting to Redis if provided. include_webui: True if the UI should be started and false otherwise. plasma_directory: A directory where the Plasma memory mapped files will be created. huge_pages: Boolean flag indicating whether to start the Object Store with hugetlbfs support. Requires plasma_directory. autoscaling_config: path to autoscaling config file. - use_raylet: True if the new raylet code path should be used. This is - not supported yet. + plasma_store_socket_name (str): If provided, it will specify the socket + name used by the plasma store. + raylet_socket_name (str): If provided, it will specify the socket path + used by the raylet process. + temp_dir (str): If provided, it will specify the root temporary + directory for the Ray process. + _internal_config (str): JSON configuration for overriding + RayConfig defaults. For testing purposes ONLY. 
Returns: A dictionary of the address information for the processes that were @@ -1778,79 +1748,31 @@ def start_ray_head(address_info=None, num_redis_shards = 1 if num_redis_shards is None else num_redis_shards return start_ray_processes( address_info=address_info, + object_manager_ports=object_manager_ports, + node_manager_ports=node_manager_ports, node_ip_address=node_ip_address, redis_port=redis_port, redis_shard_ports=redis_shard_ports, num_workers=num_workers, num_local_schedulers=num_local_schedulers, object_store_memory=object_store_memory, + redis_max_memory=redis_max_memory, + collect_profiling_data=collect_profiling_data, worker_path=worker_path, cleanup=cleanup, redirect_worker_output=redirect_worker_output, redirect_output=redirect_output, - include_global_scheduler=True, include_log_monitor=True, include_webui=include_webui, start_workers_from_local_scheduler=start_workers_from_local_scheduler, resources=resources, num_redis_shards=num_redis_shards, redis_max_clients=redis_max_clients, - redis_protected_mode=redis_protected_mode, + redis_password=redis_password, plasma_directory=plasma_directory, huge_pages=huge_pages, autoscaling_config=autoscaling_config, - use_raylet=use_raylet) - - -def try_to_create_directory(directory_path): - """Attempt to create a directory that is globally readable/writable. - - Args: - directory_path: The path of the directory to create. - """ - if not os.path.exists(directory_path): - try: - os.makedirs(directory_path) - except OSError as e: - if e.errno != os.errno.EEXIST: - raise e - logger.warning( - "Attempted to create '{}', but the directory already " - "exists.".format(directory_path)) - # Change the log directory permissions so others can use it. This is - # important when multiple people are using the same machine. - os.chmod(directory_path, 0o0777) - - -def new_log_files(name, redirect_output): - """Generate partially randomized filenames for log files. - - Args: - name (str): descriptive string for this log file. - redirect_output (bool): True if files should be generated for logging - stdout and stderr and false if stdout and stderr should not be - redirected. - - Returns: - If redirect_output is true, this will return a tuple of two - filehandles. The first is for redirecting stdout and the second is - for redirecting stderr. If redirect_output is false, this will - return a tuple of two None objects. - """ - if not redirect_output: - return None, None - - # Create a directory to be used for process log files. - logs_dir = "/tmp/raylogs" - try_to_create_directory(logs_dir) - # Create another directory that will be used by some of the RL algorithms. 
- try_to_create_directory("/tmp/ray") - - log_id = random.randint(0, 10000) - date_str = datetime.today().strftime("%Y-%m-%d_%H-%M-%S") - log_stdout = "{}/{}-{}-{:05d}.out".format(logs_dir, name, date_str, log_id) - log_stderr = "{}/{}-{}-{:05d}.err".format(logs_dir, name, date_str, log_id) - # Line-buffer the output (mode 1) - log_stdout_file = open(log_stdout, "a", buffering=1) - log_stderr_file = open(log_stderr, "a", buffering=1) - return log_stdout_file, log_stderr_file + plasma_store_socket_name=plasma_store_socket_name, + raylet_socket_name=raylet_socket_name, + temp_dir=temp_dir, + _internal_config=_internal_config) diff --git a/python/ray/tempfile_services.py b/python/ray/tempfile_services.py new file mode 100644 index 0000000000000..d4e94aec8a2ae --- /dev/null +++ b/python/ray/tempfile_services.py @@ -0,0 +1,226 @@ +import binascii +import collections +import datetime +import errno +import logging +import os +import shutil +import tempfile + +import ray.utils + +logger = logging.getLogger(__name__) +_incremental_dict = collections.defaultdict(lambda: 0) +_temp_root = None + + +def make_inc_temp(suffix="", prefix="", directory_name="/tmp/ray"): + """Return a incremental temporary file name. The file is not created. + + Args: + suffix (str): The suffix of the temp file. + prefix (str): The prefix of the temp file. + directory_name (str) : The base directory of the temp file. + + Returns: + A string of file name. If there existing a file having the same name, + the returned name will look like + "{directory_name}/{prefix}.{unique_index}{suffix}" + """ + directory_name = os.path.expanduser(directory_name) + index = _incremental_dict[suffix, prefix, directory_name] + # `tempfile.TMP_MAX` could be extremely large, + # so using `range` in Python2.x should be avoided. + while index < tempfile.TMP_MAX: + if index == 0: + filename = os.path.join(directory_name, prefix + suffix) + else: + filename = os.path.join(directory_name, + prefix + "." + str(index) + suffix) + index += 1 + if not os.path.exists(filename): + _incremental_dict[suffix, prefix, + directory_name] = index # Save the index. + return filename + + raise FileExistsError(errno.EEXIST, "No usable temporary filename found") + + +def try_to_create_directory(directory_path): + """Attempt to create a directory that is globally readable/writable. + + Args: + directory_path: The path of the directory to create. + """ + directory_path = os.path.expanduser(directory_path) + if not os.path.exists(directory_path): + try: + os.makedirs(directory_path) + except OSError as e: + if e.errno != os.errno.EEXIST: + raise e + logger.warning( + "Attempted to create '{}', but the directory already " + "exists.".format(directory_path)) + # Change the log directory permissions so others can use it. This is + # important when multiple people are using the same machine. + os.chmod(directory_path, 0o0777) + + +def get_temp_root(): + """Get the path of the temporary root. If not existing, it will be created. + """ + global _temp_root + + date_str = datetime.datetime.today().strftime("%Y-%m-%d_%H-%M-%S") + + # Lazy creation. Avoid creating directories never used. + if _temp_root is None: + _temp_root = make_inc_temp( + prefix="session_{date_str}_{pid}".format( + pid=os.getpid(), date_str=date_str), + directory_name="/tmp/ray") + try_to_create_directory(_temp_root) + return _temp_root + + +def set_temp_root(path): + """Set the path of the temporary root. 
It will be created lazily.""" + global _temp_root + _temp_root = path + + +def get_logs_dir_path(): + """Get a temp dir for logging.""" + logs_dir = os.path.join(get_temp_root(), "logs") + try_to_create_directory(logs_dir) + return logs_dir + + +def get_sockets_dir_path(): + """Get a temp dir for sockets.""" + sockets_dir = os.path.join(get_temp_root(), "sockets") + try_to_create_directory(sockets_dir) + return sockets_dir + + +def get_raylet_socket_name(suffix=""): + """Get a socket name for raylet.""" + sockets_dir = get_sockets_dir_path() + + raylet_socket_name = make_inc_temp( + prefix="raylet", directory_name=sockets_dir, suffix=suffix) + return raylet_socket_name + + +def get_object_store_socket_name(): + """Get a socket name for plasma object store.""" + sockets_dir = get_sockets_dir_path() + return make_inc_temp(prefix="plasma_store", directory_name=sockets_dir) + + +def get_ipython_notebook_path(port): + """Get a new ipython notebook path""" + + notebook_filepath = os.path.join( + os.path.dirname(os.path.abspath(__file__)), "WebUI.ipynb") + # We copy the notebook file so that the original doesn't get modified by + # the user. + notebook_name = make_inc_temp( + suffix=".ipynb", prefix="ray_ui", directory_name=get_temp_root()) + shutil.copy(notebook_filepath, notebook_name) + new_notebook_directory = os.path.dirname(notebook_name) + token = ray.utils.decode(binascii.hexlify(os.urandom(24))) + webui_url = ("http://localhost:{}/notebooks/{}?token={}".format( + port, os.path.basename(notebook_name), token)) + return new_notebook_directory, webui_url, token + + +def new_log_files(name, redirect_output): + """Generate partially randomized filenames for log files. + + Args: + name (str): descriptive string for this log file. + redirect_output (bool): True if files should be generated for logging + stdout and stderr and false if stdout and stderr should not be + redirected. + + Returns: + If redirect_output is true, this will return a tuple of two + filehandles. The first is for redirecting stdout and the second is + for redirecting stderr. If redirect_output is false, this will + return a tuple of two None objects. + """ + if not redirect_output: + return None, None + + # Create a directory to be used for process log files. + logs_dir = get_logs_dir_path() + # Create another directory that will be used by some of the RL algorithms. + + # TODO(suquark): This is done by the old code. + # We should be able to control its path later. 
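Taken together, the tempfile_services helpers give every Ray session its own directory under /tmp/ray with logs and sockets subdirectories, and make_inc_temp hands out collision-free names inside them. A hedged usage sketch (the session path in the comment is an example of the session_<date>_<pid> pattern, not a literal value):

    from ray.tempfile_services import (get_logs_dir_path, get_sockets_dir_path,
                                       get_temp_root, make_inc_temp)

    root = get_temp_root()            # e.g. /tmp/ray/session_2018-10-01_12-00-00_4242
    logs = get_logs_dir_path()        # <root>/logs, created on first use
    sockets = get_sockets_dir_path()  # <root>/sockets
    # Repeated requests with the same prefix/suffix get ".1", ".2", ... appended.
    first = make_inc_temp(suffix=".out", prefix="raylet_0", directory_name=logs)
    second = make_inc_temp(suffix=".out", prefix="raylet_0", directory_name=logs)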
+ try_to_create_directory("/tmp/ray") + + log_stdout = make_inc_temp( + suffix=".out", prefix=name, directory_name=logs_dir) + log_stderr = make_inc_temp( + suffix=".err", prefix=name, directory_name=logs_dir) + # Line-buffer the output (mode 1) + log_stdout_file = open(log_stdout, "a", buffering=1) + log_stderr_file = open(log_stderr, "a", buffering=1) + return log_stdout_file, log_stderr_file + + +def new_redis_log_file(redirect_output, shard_number=None): + """Create new logging files for redis""" + if shard_number is None: + redis_stdout_file, redis_stderr_file = new_log_files( + "redis", redirect_output) + else: + redis_stdout_file, redis_stderr_file = new_log_files( + "redis-shard_{}".format(shard_number), redirect_output) + return redis_stdout_file, redis_stderr_file + + +def new_raylet_log_file(local_scheduler_index, redirect_output): + """Create new logging files for raylet.""" + raylet_stdout_file, raylet_stderr_file = new_log_files( + "raylet_{}".format(local_scheduler_index), + redirect_output=redirect_output) + return raylet_stdout_file, raylet_stderr_file + + +def new_webui_log_file(): + """Create new logging files for web ui.""" + ui_stdout_file, ui_stderr_file = new_log_files( + "webui", redirect_output=True) + return ui_stdout_file, ui_stderr_file + + +def new_worker_redirected_log_file(worker_id): + """Create new logging files for workers to redirect its output.""" + worker_stdout_file, worker_stderr_file = (new_log_files( + "worker-" + ray.utils.binary_to_hex(worker_id), True)) + return worker_stdout_file, worker_stderr_file + + +def new_log_monitor_log_file(): + """Create new logging files for the log monitor.""" + log_monitor_stdout_file, log_monitor_stderr_file = new_log_files( + "log_monitor", redirect_output=True) + return log_monitor_stdout_file, log_monitor_stderr_file + + +def new_plasma_store_log_file(local_scheduler_index, redirect_output): + """Create new logging files for the plasma store.""" + plasma_store_stdout_file, plasma_store_stderr_file = new_log_files( + "plasma_store_{}".format(local_scheduler_index), redirect_output) + return plasma_store_stdout_file, plasma_store_stderr_file + + +def new_monitor_log_file(redirect_output): + """Create new logging files for the monitor.""" + monitor_stdout_file, monitor_stderr_file = new_log_files( + "monitor", redirect_output) + return monitor_stdout_file, monitor_stderr_file diff --git a/python/ray/test/cluster_utils.py b/python/ray/test/cluster_utils.py new file mode 100644 index 0000000000000..41dc3b6cdd26a --- /dev/null +++ b/python/ray/test/cluster_utils.py @@ -0,0 +1,226 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import atexit +import logging +import time + +import ray +import ray.services as services + +logger = logging.getLogger(__name__) + + +class Cluster(object): + def __init__(self, + initialize_head=False, + connect=False, + head_node_args=None, + shutdown_at_exit=True): + """Initializes the cluster. + + Args: + initialize_head (bool): Automatically start a Ray cluster + by initializing the head node. Defaults to False. + connect (bool): If `initialize_head=True` and `connect=True`, + ray.init will be called with the redis address of this cluster + passed in. + head_node_args (dict): Arguments to be passed into + `start_ray_head` via `self.add_node`. + shutdown_at_exit (bool): If True, registers an exit hook + for shutting down all started processes. 
+ """ + self.head_node = None + self.worker_nodes = {} + self.redis_address = None + if not initialize_head and connect: + raise RuntimeError("Cannot connect to uninitialized cluster.") + + if initialize_head: + head_node_args = head_node_args or {} + self.add_node(**head_node_args) + if connect: + redis_password = head_node_args.get("redis_password") + output_info = ray.init( + redis_address=self.redis_address, + redis_password=redis_password) + logger.info(output_info) + if shutdown_at_exit: + atexit.register(self.shutdown) + + def add_node(self, **override_kwargs): + """Adds a node to the local Ray Cluster. + + All nodes are by default started with the following settings: + cleanup=True, + resources={"CPU": 1}, + object_store_memory=100 * (2**20) # 100 MB + + Args: + override_kwargs: Keyword arguments used in `start_ray_head` + and `start_ray_node`. Overrides defaults. + + Returns: + Node object of the added Ray node. + """ + node_kwargs = { + "cleanup": True, + "resources": { + "CPU": 1 + }, + "object_store_memory": 100 * (2**20) # 100 MB + } + node_kwargs.update(override_kwargs) + + if self.head_node is None: + address_info = services.start_ray_head( + node_ip_address=services.get_node_ip_address(), + include_webui=False, + **node_kwargs) + self.redis_address = address_info["redis_address"] + # TODO(rliaw): Find a more stable way than modifying global state. + process_dict_copy = services.all_processes.copy() + for key in services.all_processes: + services.all_processes[key] = [] + node = Node(process_dict_copy) + self.head_node = node + else: + address_info = services.start_ray_node( + services.get_node_ip_address(), self.redis_address, + **node_kwargs) + # TODO(rliaw): Find a more stable way than modifying global state. + process_dict_copy = services.all_processes.copy() + for key in services.all_processes: + services.all_processes[key] = [] + node = Node(process_dict_copy) + self.worker_nodes[node] = address_info + logger.info("Starting Node with raylet socket {}".format( + address_info["raylet_socket_names"])) + + return node + + def remove_node(self, node): + """Kills all processes associated with worker node. + + Args: + node (Node): Worker node of which all associated processes + will be removed. + """ + if self.head_node == node: + self.head_node.kill_all_processes() + self.head_node = None + # TODO(rliaw): Do we need to kill all worker processes? + else: + node.kill_all_processes() + self.worker_nodes.pop(node) + + assert not node.any_processes_alive(), ( + "There are zombie processes left over after killing.") + + def wait_for_nodes(self, retries=30): + """Waits for all nodes to be registered with global state. + + By default, waits for 3 seconds. + + Args: + retries (int): Number of times to retry checking client table. + + Returns: + True if successfully registered nodes as expected. + """ + + for i in range(retries): + if not ray.is_initialized() or not self._check_registered_nodes(): + time.sleep(0.1) + else: + return True + return False + + def _check_registered_nodes(self): + registered = len([ + client for client in ray.global_state.client_table() + if client["IsInsertion"] + ]) + expected = len(self.list_all_nodes()) + if registered == expected: + logger.info("All nodes registered as expected.") + else: + logger.info("Currently registering {} but expecting {}".format( + registered, expected)) + return registered == expected + + def list_all_nodes(self): + """Lists all nodes. + + TODO(rliaw): What is the desired behavior if a head node + dies before worker nodes die? 
+ + Returns: + List of all nodes, including the head node. + """ + nodes = list(self.worker_nodes) + if self.head_node: + nodes = [self.head_node] + nodes + return nodes + + def shutdown(self): + """Removes all nodes.""" + + # We create a list here as a copy because `remove_node` + # modifies `self.worker_nodes`. + all_nodes = list(self.worker_nodes) + for node in all_nodes: + self.remove_node(node) + + if self.head_node: + self.remove_node(self.head_node) + else: + logger.warning("No headnode exists!") + + +class Node(object): + """Abstraction for a Ray node.""" + + def __init__(self, process_dict): + # TODO(rliaw): Is there a unique identifier for a node? + self.process_dict = process_dict + + def kill_plasma_store(self): + self.process_dict[services.PROCESS_TYPE_PLASMA_STORE][0].kill() + self.process_dict[services.PROCESS_TYPE_PLASMA_STORE][0].wait() + + def kill_raylet(self): + self.process_dict[services.PROCESS_TYPE_RAYLET][0].kill() + self.process_dict[services.PROCESS_TYPE_RAYLET][0].wait() + + def kill_log_monitor(self): + self.process_dict["log_monitor"][0].kill() + self.process_dict["log_monitor"][0].wait() + + def kill_all_processes(self): + for process_name, process_list in self.process_dict.items(): + logger.info("Killing all {}(s)".format(process_name)) + for process in process_list: + # Kill the process if it is still alive. + if process.poll() is None: + process.kill() + + for process_name, process_list in self.process_dict.items(): + logger.info("Waiting all {}(s)".format(process_name)) + for process in process_list: + process.wait() + + def live_processes(self): + return [(p_name, proc) for p_name, p_list in self.process_dict.items() + for proc in p_list if proc.poll() is None] + + def dead_processes(self): + return [(p_name, proc) for p_name, p_list in self.process_dict.items() + for proc in p_list if proc.poll() is not None] + + def any_processes_alive(self): + return any(self.live_processes()) + + def all_processes_alive(self): + return not any(self.dead_processes()) diff --git a/python/ray/test/test_global_state.py b/python/ray/test/test_global_state.py index 7b12ee0227902..68805a8ec5612 100644 --- a/python/ray/test/test_global_state.py +++ b/python/ray/test/test_global_state.py @@ -2,57 +2,107 @@ from __future__ import division from __future__ import print_function +import json +import pytest +try: + import pytest_timeout +except ImportError: + pytest_timeout = None import time import ray - - -def setup_module(): - if not ray.worker.global_worker.connected: - ray.init(num_cpus=1) - - # Finish initializing Ray. Otherwise available_resources() does not - # reflect resource use of submitted tasks - ray.get(cpu_task.remote(0)) - - -@ray.remote(num_cpus=1) -def cpu_task(seconds): - time.sleep(seconds) - - -class TestAvailableResources(object): - timeout = 10 - - def test_no_tasks(self): - cluster_resources = ray.global_state.cluster_resources() +from ray.test.cluster_utils import Cluster + + +@pytest.fixture +def ray_start(): + # Start the Ray processes. + ray.init(num_cpus=1) + yield None + # The code after the yield will run as teardown code. + ray.shutdown() + + +@pytest.fixture +def cluster_start(): + # Start the Ray processes. + cluster = Cluster( + initialize_head=True, + connect=True, + head_node_args={ + "resources": dict(CPU=1), + "_internal_config": json.dumps({ + "num_heartbeats_timeout": 10 + }) + }) + yield cluster + ray.shutdown() + cluster.shutdown() + + +# TODO(rliaw): The proper way to do this is to have the pytest config setup. 
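The Cluster and Node helpers above wrap the process bookkeeping so tests can grow and shrink a local cluster. A condensed usage sketch based on the API shown in this file:

    import ray
    from ray.test.cluster_utils import Cluster

    cluster = Cluster(initialize_head=True, connect=True,
                      head_node_args={"resources": {"CPU": 1}})
    worker = cluster.add_node(resources={"CPU": 1})
    assert cluster.wait_for_nodes()   # polls until both nodes are registered
    cluster.remove_node(worker)       # kills all processes of that worker node
    assert cluster.wait_for_nodes()
    ray.shutdown()
    cluster.shutdown()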
+@pytest.mark.skipif( + pytest_timeout is None, + reason="Timeout package not installed; skipping test that may hang.") +@pytest.mark.timeout(10) +def test_replenish_resources(ray_start): + cluster_resources = ray.global_state.cluster_resources() + available_resources = ray.global_state.available_resources() + assert cluster_resources == available_resources + + @ray.remote + def cpu_task(): + pass + + ray.get(cpu_task.remote()) + resources_reset = False + + while not resources_reset: available_resources = ray.global_state.available_resources() - assert cluster_resources == available_resources - - def test_replenish_resources(self): - cluster_resources = ray.global_state.cluster_resources() + resources_reset = (cluster_resources == available_resources) + assert resources_reset - ray.get(cpu_task.remote(0)) - start = time.time() - resources_reset = False - while not resources_reset and time.time() - start < self.timeout: - available_resources = ray.global_state.available_resources() - resources_reset = (cluster_resources == available_resources) +@pytest.mark.skipif( + pytest_timeout is None, + reason="Timeout package not installed; skipping test that may hang.") +@pytest.mark.timeout(10) +def test_uses_resources(ray_start): + cluster_resources = ray.global_state.cluster_resources() - assert resources_reset + @ray.remote + def cpu_task(): + time.sleep(1) - def test_uses_resources(self): - cluster_resources = ray.global_state.cluster_resources() - task_id = cpu_task.remote(1) - start = time.time() - resource_used = False + cpu_task.remote() + resource_used = False - while not resource_used and time.time() - start < self.timeout: - available_resources = ray.global_state.available_resources() - resource_used = available_resources[ - "CPU"] == cluster_resources["CPU"] - 1 - - assert resource_used - - ray.get(task_id) # clean up to reset resources + while not resource_used: + available_resources = ray.global_state.available_resources() + resource_used = available_resources[ + "CPU"] == cluster_resources["CPU"] - 1 + + assert resource_used + + +@pytest.mark.skipif( + pytest_timeout is None, + reason="Timeout package not installed; skipping test that may hang.") +@pytest.mark.timeout(20) +def test_add_remove_cluster_resources(cluster_start): + """Tests that Global State API is consistent with actual cluster.""" + cluster = cluster_start + assert ray.global_state.cluster_resources()["CPU"] == 1 + nodes = [] + nodes += [cluster.add_node(resources=dict(CPU=1))] + assert cluster.wait_for_nodes() + assert ray.global_state.cluster_resources()["CPU"] == 2 + + cluster.remove_node(nodes.pop()) + assert cluster.wait_for_nodes() + assert ray.global_state.cluster_resources()["CPU"] == 1 + + for i in range(5): + nodes += [cluster.add_node(resources=dict(CPU=1))] + assert cluster.wait_for_nodes() + assert ray.global_state.cluster_resources()["CPU"] == 6 diff --git a/python/ray/test/test_modin.py b/python/ray/test/test_modin.py new file mode 100644 index 0000000000000..83c11895ec7b8 --- /dev/null +++ b/python/ray/test/test_modin.py @@ -0,0 +1,12 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import ray # noqa F401 + + +def test_modin_import(): + import modin.pandas as pd + frame_data = [1, 2, 3, 4, 5, 6, 7, 8] + frame = pd.DataFrame(frame_data) + assert frame.sum().squeeze() == sum(frame_data) diff --git a/python/ray/test/test_ray_init.py b/python/ray/test/test_ray_init.py new file mode 100644 index 0000000000000..2b17ce35ef286 --- /dev/null 
+++ b/python/ray/test/test_ray_init.py @@ -0,0 +1,70 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import os +import pytest +import redis + +import ray +from ray.test.cluster_utils import Cluster + + +@pytest.fixture +def password(): + random_bytes = os.urandom(128) + if hasattr(random_bytes, "hex"): + return random_bytes.hex() # Python 3 + return random_bytes.encode("hex") # Python 2 + + +@pytest.fixture +def shutdown_only(): + yield None + # The code after the yield will run as teardown code. + ray.shutdown() + + +class TestRedisPassword(object): + @pytest.mark.skipif( + os.environ.get("RAY_USE_NEW_GCS") == "on", + reason="New GCS API doesn't support Redis authentication yet.") + def test_redis_password(self, password, shutdown_only): + @ray.remote + def f(): + return 1 + + info = ray.init(redis_password=password) + redis_address = info["redis_address"] + redis_ip, redis_port = redis_address.split(":") + + # Check that we can run a task + object_id = f.remote() + ray.get(object_id) + + # Check that Redis connections require a password + redis_client = redis.StrictRedis( + host=redis_ip, port=redis_port, password=None) + with pytest.raises(redis.ResponseError): + redis_client.ping() + + # Check that we can connect to Redis using the provided password + redis_client = redis.StrictRedis( + host=redis_ip, port=redis_port, password=password) + assert redis_client.ping() + + @pytest.mark.skipif( + os.environ.get("RAY_USE_NEW_GCS") == "on", + reason="New GCS API doesn't support Redis authentication yet.") + def test_redis_password_cluster(self, password, shutdown_only): + @ray.remote + def f(): + return 1 + + node_args = {"redis_password": password} + cluster = Cluster( + initialize_head=True, connect=True, head_node_args=node_args) + cluster.add_node(**node_args) + + object_id = f.remote() + ray.get(object_id) diff --git a/python/ray/test/test_utils.py b/python/ray/test/test_utils.py index a29daa5a073ec..a3614650e97ba 100644 --- a/python/ray/test/test_utils.py +++ b/python/ray/test/test_utils.py @@ -6,6 +6,7 @@ import os import redis import subprocess +import sys import tempfile import time @@ -34,22 +35,11 @@ def _wait_for_nodes_to_join(num_nodes, timeout=20): client_table = ray.global_state.client_table() num_ready_nodes = len(client_table) if num_ready_nodes == num_nodes: - ready = True # Check that for each node, a local scheduler and a plasma manager # are present. - if ray.global_state.use_raylet: - # In raylet mode, this is a list of map. - # The GCS info will appear as a whole instead of part by part. - return - else: - for ip_address, clients in client_table.items(): - client_types = [client["ClientType"] for client in clients] - if "local_scheduler" not in client_types: - ready = False - if "plasma_manager" not in client_types: - ready = False - if ready: - return + # In raylet mode, this is a list of map. + # The GCS info will appear as a whole instead of part by part. + return if num_ready_nodes > num_nodes: # Too many nodes have joined. Something must be wrong. raise Exception("{} nodes have joined the cluster, but we were " @@ -147,3 +137,40 @@ def run_and_get_output(command): with open(tmp.name, 'r') as f: result = f.readlines() return "\n".join(result) + + +def run_string_as_driver(driver_script): + """Run a driver as a separate process. + + Args: + driver_script: A string to run as a Python script. + + Returns: + The script's output. 
+ """ + # Save the driver script as a file so we can call it using subprocess. + with tempfile.NamedTemporaryFile() as f: + f.write(driver_script.encode("ascii")) + f.flush() + out = ray.utils.decode( + subprocess.check_output([sys.executable, f.name])) + return out + + +def run_string_as_driver_nonblocking(driver_script): + """Start a driver as a separate process and return immediately. + + Args: + driver_script: A string to run as a Python script. + + Returns: + A handle to the driver process. + """ + # Save the driver script as a file so we can call it using subprocess. We + # do not delete this file because if we do then it may get removed before + # the Python process tries to run it. + with tempfile.NamedTemporaryFile(delete=False) as f: + f.write(driver_script.encode("ascii")) + f.flush() + return subprocess.Popen( + [sys.executable, f.name], stdout=subprocess.PIPE) diff --git a/python/ray/tune/README.rst b/python/ray/tune/README.rst index 2d7533f56a0f6..5635ab3ff8856 100644 --- a/python/ray/tune/README.rst +++ b/python/ray/tune/README.rst @@ -6,6 +6,14 @@ Tune is a scalable framework for hyperparameter search with a focus on deep lear User documentation can be `found here `__. +Tutorial +-------- + +To get started with Tune, try going through `our tutorial of using Tune with Keras `__. + +(Experimental): You can try out `the above tutorial on a free hosted server via Binder `__. + + Citing Tune ----------- diff --git a/python/ray/tune/__init__.py b/python/ray/tune/__init__.py index 83d4f4fdece37..1e341b26526ea 100644 --- a/python/ray/tune/__init__.py +++ b/python/ray/tune/__init__.py @@ -7,9 +7,16 @@ from ray.tune.experiment import Experiment from ray.tune.registry import register_env, register_trainable from ray.tune.trainable import Trainable -from ray.tune.suggest import grid_search, function +from ray.tune.suggest import grid_search, function, sample_from __all__ = [ - "Trainable", "TuneError", "grid_search", "register_env", - "register_trainable", "run_experiments", "Experiment", "function" + "Trainable", + "TuneError", + "grid_search", + "register_env", + "register_trainable", + "run_experiments", + "Experiment", + "function", + "sample_from", ] diff --git a/python/ray/tune/examples/README.rst b/python/ray/tune/examples/README.rst index 3d35497c8841a..a762a057021c3 100644 --- a/python/ray/tune/examples/README.rst +++ b/python/ray/tune/examples/README.rst @@ -1,4 +1,60 @@ Tune Examples ============= -Code examples for various schedulers and Tune features. +.. Keep this in sync with ray/doc/tune-examples.rst + +In our repository, we provide a variety of examples for the various use cases and features of Tune. + +If any example is broken, or if you'd like to add an example to this page, feel free to raise an issue on our Github repository. + + +General Examples +---------------- + +- `async_hyperband_example `__: + Example of using a Trainable class with AsyncHyperBandScheduler. +- `hyperband_example `__: + Example of using a Trainable class with HyperBandScheduler. Also uses the Experiment class API for specifying the experiment configuration. +- `hyperopt_example `__: + Optimizes a basic function using the function-based API and the HyperOptSearch (SearchAlgorithm wrapper for HyperOpt TPE). + Also uses the AsyncHyperBandScheduler. +- `pbt_example `__: + Example of using a Trainable class with PopulationBasedTraining scheduler. +- `pbt_ppo_example `__: + Example of optimizing a distributed RLlib algorithm (PPO) with the PopulationBasedTraining scheduler. 
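Most of the examples listed in this README share the same skeleton: define a trainable (class- or function-based), wrap randomly drawn config values in `sample_from`, and hand a scheduler to `run_experiments`. The following condensed sketch shows that skeleton; the trainable, experiment name, and numbers are illustrative rather than taken from any single example.

import random

import ray
from ray.tune import run_experiments, sample_from
from ray.tune.schedulers import AsyncHyperBandScheduler


def my_trainable(config, reporter):
    # Toy objective whose reported "accuracy" depends on the sampled width.
    for step in range(100):
        reporter(timesteps_total=step, mean_accuracy=config["width"] / 100.0)


ray.init()
run_experiments(
    {
        "tune_sketch": {
            "run": my_trainable,
            "num_samples": 4,
            "stop": {"training_iteration": 99},
            "config": {
                "width": sample_from(
                    lambda spec: 10 + int(90 * random.random())),
            },
        }
    },
    scheduler=AsyncHyperBandScheduler(reward_attr="mean_accuracy"))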
+ + +Keras Examples +-------------- + +- `tune_mnist_keras `__: + Converts the Keras MNIST example to use Tune with the function-based API and a Keras callback. Also shows how to easily convert something relying on argparse to use Tune. + + +PyTorch Examples +---------------- + +- `mnist_pytorch `__: + Converts the PyTorch MNIST example to use Tune with the function-based API. Also shows how to easily convert something relying on argparse to use Tune. +- `mnist_pytorch_trainable `__: + Converts the PyTorch MNIST example to use Tune with Trainable API. Also uses the HyperBandScheduler and checkpoints the model at the end. + + +TensorFlow Examples +------------------- + +- `tune_mnist_ray `__: + A basic example of tuning a TensorFlow model on MNIST using the Trainable class. +- `tune_mnist_ray_hyperband `__: + A basic example of tuning a TensorFlow model on MNIST using the Trainable class and the HyperBand scheduler. +- `tune_mnist_async_hyperband `__: + Example of tuning a TensorFlow model on MNIST using AsyncHyperBand. + + +Contributed Examples +-------------------- + +- `pbt_tune_cifar10_with_keras `__: + A contributed example of tuning a Keras model on CIFAR10 with the PopulationBasedTraining scheduler. +- `genetic_example `__: + Optimizing the michalewicz function using the contributed GeneticSearch search algorithm with AsyncHyperBandScheduler. diff --git a/python/ray/rllib/examples/legacy_multiagent/__init__.py b/python/ray/tune/examples/__init__.py similarity index 100% rename from python/ray/rllib/examples/legacy_multiagent/__init__.py rename to python/ray/tune/examples/__init__.py diff --git a/python/ray/tune/examples/async_hyperband_example.py b/python/ray/tune/examples/async_hyperband_example.py index 2c368b4e3d05e..871e8c1718ea0 100644 --- a/python/ray/tune/examples/async_hyperband_example.py +++ b/python/ray/tune/examples/async_hyperband_example.py @@ -12,7 +12,7 @@ import numpy as np import ray -from ray.tune import Trainable, run_experiments +from ray.tune import Trainable, run_experiments, sample_from from ray.tune.schedulers import AsyncHyperBandScheduler @@ -23,7 +23,7 @@ class MyTrainableClass(Trainable): maximum reward value reached. """ - def _setup(self): + def _setup(self, config): self.timestep = 0 def _train(self): @@ -76,8 +76,10 @@ def _restore(self, checkpoint_path): "gpu": 0 }, "config": { - "width": lambda spec: 10 + int(90 * random.random()), - "height": lambda spec: int(100 * random.random()), + "width": sample_from( + lambda spec: 10 + int(90 * random.random())), + "height": sample_from( + lambda spec: int(100 * random.random())), }, } }, diff --git a/python/ray/tune/examples/hyperband_example.py b/python/ray/tune/examples/hyperband_example.py index 94f603e8206cf..d403a0e0f8af1 100755 --- a/python/ray/tune/examples/hyperband_example.py +++ b/python/ray/tune/examples/hyperband_example.py @@ -12,7 +12,7 @@ import numpy as np import ray -from ray.tune import Trainable, run_experiments, Experiment +from ray.tune import Trainable, run_experiments, Experiment, sample_from from ray.tune.schedulers import HyperBandScheduler @@ -23,7 +23,7 @@ class MyTrainableClass(Trainable): maximum reward value reached. 
""" - def _setup(self): + def _setup(self, config): self.timestep = 0 def _train(self): @@ -67,8 +67,8 @@ def _restore(self, checkpoint_path): num_samples=20, stop={"training_iteration": 1 if args.smoke_test else 99999}, config={ - "width": lambda spec: 10 + int(90 * random.random()), - "height": lambda spec: int(100 * random.random()) + "width": sample_from(lambda spec: 10 + int(90 * random.random())), + "height": sample_from(lambda spec: int(100 * random.random())) }) run_experiments(exp, scheduler=hyperband) diff --git a/python/ray/tune/examples/hyperopt_example.py b/python/ray/tune/examples/hyperopt_example.py index 6d61b1321e2ed..2898bf26d8539 100644 --- a/python/ray/tune/examples/hyperopt_example.py +++ b/python/ray/tune/examples/hyperopt_example.py @@ -48,7 +48,7 @@ def easy_objective(config, reporter): "run": "exp", "num_samples": 10 if args.smoke_test else 1000, "stop": { - "training_iteration": 100 + "timesteps_total": 100 }, } } diff --git a/python/ray/tune/examples/mnist_pytorch.py b/python/ray/tune/examples/mnist_pytorch.py index bfd319bff3c9d..bec73f3d51249 100644 --- a/python/ray/tune/examples/mnist_pytorch.py +++ b/python/ray/tune/examples/mnist_pytorch.py @@ -182,8 +182,10 @@ def test(): "run": "train_mnist", "num_samples": 1 if args.smoke_test else 10, "config": { - "lr": lambda spec: np.random.uniform(0.001, 0.1), - "momentum": lambda spec: np.random.uniform(0.1, 0.9), + "lr": tune.sample_from( + lambda spec: np.random.uniform(0.001, 0.1)), + "momentum": tune.sample_from( + lambda spec: np.random.uniform(0.1, 0.9)), } } }, diff --git a/python/ray/tune/examples/mnist_pytorch_trainable.py b/python/ray/tune/examples/mnist_pytorch_trainable.py index 0d23c0cc21304..6005cd79c14fb 100644 --- a/python/ray/tune/examples/mnist_pytorch_trainable.py +++ b/python/ray/tune/examples/mnist_pytorch_trainable.py @@ -80,9 +80,9 @@ def forward(self, x): class TrainMNIST(Trainable): - def _setup(self): - args = self.config.pop("args") - vars(args).update(self.config) + def _setup(self, config): + args = config.pop("args") + vars(args).update(config) args.cuda = not args.no_cuda and torch.cuda.is_available() torch.manual_seed(args.seed) @@ -159,12 +159,13 @@ def _train(self): self._train_iteration() return self._test() - def _save(self, path): - torch.save(self.model.state_dict(), os.path.join(path, "model.pth")) - return path + def _save(self, checkpoint_dir): + checkpoint_path = os.path.join(checkpoint_dir, "model.pth") + torch.save(self.model.state_dict(), checkpoint_path) + return checkpoint_path - def _restore(self, path): - self.model.load_state_dict(os.path.join(path, "model.pth")) + def _restore(self, checkpoint_path): + self.model.load_state_dict(checkpoint_path) if __name__ == '__main__': @@ -194,8 +195,10 @@ def _restore(self, path): "checkpoint_at_end": True, "config": { "args": args, - "lr": lambda spec: np.random.uniform(0.001, 0.1), - "momentum": lambda spec: np.random.uniform(0.1, 0.9), + "lr": tune.sample_from( + lambda spec: np.random.uniform(0.001, 0.1)), + "momentum": tune.sample_from( + lambda spec: np.random.uniform(0.1, 0.9)), } } }, diff --git a/python/ray/tune/examples/pbt_example.py b/python/ray/tune/examples/pbt_example.py index c958d2512e83a..3433e82f94eed 100755 --- a/python/ray/tune/examples/pbt_example.py +++ b/python/ray/tune/examples/pbt_example.py @@ -18,7 +18,7 @@ class MyTrainableClass(Trainable): """Fake agent whose learning rate is determined by dummy factors.""" - def _setup(self): + def _setup(self, config): self.timestep = 0 self.current_value = 0.0 
diff --git a/python/ray/tune/examples/pbt_ppo_example.py b/python/ray/tune/examples/pbt_ppo_example.py index efd7ee4a89580..a81d4109f62c1 100755 --- a/python/ray/tune/examples/pbt_ppo_example.py +++ b/python/ray/tune/examples/pbt_ppo_example.py @@ -13,7 +13,7 @@ import random import ray -from ray.tune import run_experiments +from ray.tune import run_experiments, sample_from from ray.tune.schedulers import PopulationBasedTraining if __name__ == "__main__": @@ -63,12 +63,12 @@ def explore(config): "clip_param": 0.2, "lr": 1e-4, # These params start off randomly drawn from a set. - "num_sgd_iter": - lambda spec: random.choice([10, 20, 30]), - "sgd_minibatch_size": - lambda spec: random.choice([128, 512, 2048]), - "train_batch_size": - lambda spec: random.choice([10000, 20000, 40000]) + "num_sgd_iter": sample_from( + lambda spec: random.choice([10, 20, 30])), + "sgd_minibatch_size": sample_from( + lambda spec: random.choice([128, 512, 2048])), + "train_batch_size": sample_from( + lambda spec: random.choice([10000, 20000, 40000])) }, }, }, diff --git a/python/ray/tune/examples/pbt_tune_cifar10_with_keras.py b/python/ray/tune/examples/pbt_tune_cifar10_with_keras.py index 28575f5466824..692c967cf2946 100755 --- a/python/ray/tune/examples/pbt_tune_cifar10_with_keras.py +++ b/python/ray/tune/examples/pbt_tune_cifar10_with_keras.py @@ -23,7 +23,7 @@ from tensorflow.python.keras.preprocessing.image import ImageDataGenerator import ray -from ray.tune import grid_search, run_experiments +from ray.tune import grid_search, run_experiments, sample_from from ray.tune import Trainable from ray.tune.schedulers import PopulationBasedTraining @@ -105,7 +105,7 @@ def _build_model(self, input_shape): model = Model(inputs=x, outputs=y, name="model1") return model - def _setup(self): + def _setup(self, config): self.train_data, self.test_data = self._read_data() x_train = self.train_data[0] model = self._build_model(x_train.shape[1:]) @@ -193,7 +193,7 @@ def _stop(self): "epochs": 1, "batch_size": 64, "lr": grid_search([10**-4, 10**-5]), - "decay": lambda spec: spec.config.lr / 100.0, + "decay": sample_from(lambda spec: spec.config.lr / 100.0), "dropout": grid_search([0.25, 0.5]), }, "num_samples": 4, diff --git a/python/ray/tune/examples/tune_mnist_keras.py b/python/ray/tune/examples/tune_mnist_keras.py index 32cfb371efc46..cbe9f626df6f4 100644 --- a/python/ray/tune/examples/tune_mnist_keras.py +++ b/python/ray/tune/examples/tune_mnist_keras.py @@ -105,6 +105,8 @@ def create_parser(): parser = argparse.ArgumentParser(description='Keras MNIST Example') parser.add_argument( "--smoke-test", action="store_true", help="Finish quickly for testing") + parser.add_argument( + "--use-gpu", action="store_true", help="Use GPU in training.") parser.add_argument( '--jobs', type=int, @@ -113,8 +115,8 @@ def create_parser(): parser.add_argument( '--threads', type=int, - default=None, - help='threads used in operations (default: all)') + default=2, + help='threads used in operations (default: 2)') parser.add_argument( '--steps', type=float, @@ -185,11 +187,19 @@ def create_parser(): }, "run": "train_mnist", "num_samples": 1 if args.smoke_test else 10, + "trial_resources": { + "cpu": args.threads, + "gpu": 0.5 if args.use_gpu else 0 + }, "config": { - "lr": lambda spec: np.random.uniform(0.001, 0.1), - "momentum": lambda spec: np.random.uniform(0.1, 0.9), - "hidden": lambda spec: np.random.randint(32, 512), - "dropout1": lambda spec: np.random.uniform(0.2, 0.8), + "lr": tune.sample_from( + lambda spec: np.random.uniform(0.001, 
0.1)), + "momentum": tune.sample_from( + lambda spec: np.random.uniform(0.1, 0.9)), + "hidden": tune.sample_from( + lambda spec: np.random.randint(32, 512)), + "dropout1": tune.sample_from( + lambda spec: np.random.uniform(0.2, 0.8)), } } }, diff --git a/python/ray/tune/examples/tune_mnist_ray.py b/python/ray/tune/examples/tune_mnist_ray.py index e806a1a68ac8e..e56ebd10f5ebc 100755 --- a/python/ray/tune/examples/tune_mnist_ray.py +++ b/python/ray/tune/examples/tune_mnist_ray.py @@ -42,7 +42,7 @@ FLAGS = None status_reporter = None # used to report training status back to Ray -activation_fn = None # e.g. tf.nn.relu +activation_fn = tf.nn.relu # e.g. tf.nn.relu def deepnn(x): diff --git a/python/ray/tune/examples/tune_mnist_ray_hyperband.py b/python/ray/tune/examples/tune_mnist_ray_hyperband.py index 29939ff243085..bce19deca6859 100755 --- a/python/ray/tune/examples/tune_mnist_ray_hyperband.py +++ b/python/ray/tune/examples/tune_mnist_ray_hyperband.py @@ -31,7 +31,7 @@ import ray from ray.tune import grid_search, run_experiments, register_trainable, \ - Trainable + Trainable, sample_from from ray.tune.schedulers import HyperBandScheduler from tensorflow.examples.tutorials.mnist import input_data @@ -128,7 +128,7 @@ def bias_variable(shape): class TrainMNIST(Trainable): """Example MNIST trainable.""" - def _setup(self): + def _setup(self, config): global activation_fn self.timestep = 0 @@ -148,7 +148,7 @@ def _setup(self): self.x = tf.placeholder(tf.float32, [None, 784]) self.y_ = tf.placeholder(tf.float32, [None, 10]) - activation_fn = getattr(tf.nn, self.config['activation']) + activation_fn = getattr(tf.nn, config['activation']) # Build the graph for the deep net y_conv, self.keep_prob = setupCNN(self.x) @@ -160,7 +160,7 @@ def _setup(self): with tf.name_scope('adam_optimizer'): train_step = tf.train.AdamOptimizer( - self.config['learning_rate']).minimize(cross_entropy) + config['learning_rate']).minimize(cross_entropy) self.train_step = train_step @@ -221,7 +221,8 @@ def _restore(self, path): 'time_total_s': 600, }, 'config': { - 'learning_rate': lambda spec: 10**np.random.uniform(-5, -3), + 'learning_rate': sample_from( + lambda spec: 10**np.random.uniform(-5, -3)), 'activation': grid_search(['relu', 'elu', 'tanh']), }, "num_samples": 10, diff --git a/python/ray/tune/experiment.py b/python/ray/tune/experiment.py index 390a66193d672..3a4ddc9c7aab8 100644 --- a/python/ray/tune/experiment.py +++ b/python/ray/tune/experiment.py @@ -85,7 +85,7 @@ def __init__(self, repeat=1, num_samples=1, local_dir=None, - upload_dir="", + upload_dir=None, checkpoint_freq=0, checkpoint_at_end=False, max_failures=3, @@ -97,7 +97,7 @@ def __init__(self, "trial_resources": trial_resources, "num_samples": num_samples, "local_dir": local_dir or DEFAULT_RESULTS_DIR, - "upload_dir": upload_dir, + "upload_dir": upload_dir or "", # argparse converts None to "null" "checkpoint_freq": checkpoint_freq, "checkpoint_at_end": checkpoint_at_end, "max_failures": max_failures, diff --git a/python/ray/tune/function_runner.py b/python/ray/tune/function_runner.py index d1704b6aa94fe..47593f2213bcd 100644 --- a/python/ray/tune/function_runner.py +++ b/python/ray/tune/function_runner.py @@ -14,11 +14,12 @@ class StatusReporter(object): - """Object passed into your main() that you can report status through. + """Object passed into your function that you can report status through. 
Example: - >>> reporter = StatusReporter() - >>> reporter(timesteps_total=1) + >>> def trainable_function(config, reporter): + >>> assert isinstance(reporter, StatusReporter) + >>> reporter(timesteps_total=1) """ def __init__(self): @@ -33,6 +34,9 @@ def __call__(self, **kwargs): Args: kwargs: Latest training result status. + + Example: + >>> reporter(mean_accuracy=1, training_iteration=4) """ with self._lock: @@ -90,10 +94,10 @@ class FunctionRunner(Trainable): _name = "func" _default_config = DEFAULT_CONFIG - def _setup(self): + def _setup(self, config): entrypoint = self._trainable_func() self._status_reporter = StatusReporter() - scrubbed_config = self.config.copy() + scrubbed_config = config.copy() for k in self._default_config: if k in scrubbed_config: del scrubbed_config[k] diff --git a/python/ray/tune/log_sync.py b/python/ray/tune/log_sync.py index 2e18a86582085..109c11a01707f 100644 --- a/python/ray/tune/log_sync.py +++ b/python/ray/tune/log_sync.py @@ -107,11 +107,13 @@ def sync_now(self, force=False): if not distutils.spawn.find_executable("rsync"): logger.error("Log sync requires rsync to be installed.") return + source = '{}@{}:{}/'.format(ssh_user, self.worker_ip, + self.local_dir) + target = '{}/'.format(self.local_dir) worker_to_local_sync_cmd = (( - """rsync -avz -e "ssh -i {} -o ConnectTimeout=120s """ - """-o StrictHostKeyChecking=no" '{}@{}:{}/' '{}/'""").format( - quote(ssh_key), ssh_user, self.worker_ip, - quote(self.local_dir), quote(self.local_dir))) + """rsync -savz -e "ssh -i {} -o ConnectTimeout=120s """ + """-o StrictHostKeyChecking=no" {} {}""").format( + quote(ssh_key), quote(source), quote(target))) if self.remote_dir: if self.remote_dir.startswith(S3_PREFIX): diff --git a/python/ray/tune/logger.py b/python/ray/tune/logger.py index f73aa4a1ef8ce..183ba6490b979 100644 --- a/python/ray/tune/logger.py +++ b/python/ray/tune/logger.py @@ -9,6 +9,7 @@ import os import yaml +import ray.cloudpickle as cloudpickle from ray.tune.log_sync import get_syncer from ray.tune.result import NODE_IP, TRAINING_ITERATION, TIME_TOTAL_S, \ TIMESTEPS_TOTAL @@ -97,7 +98,15 @@ class _JsonLogger(Logger): def _init(self): config_out = os.path.join(self.logdir, "params.json") with open(config_out, "w") as f: - json.dump(self.config, f, sort_keys=True, cls=_SafeFallbackEncoder) + json.dump( + self.config, + f, + indent=2, + sort_keys=True, + cls=_SafeFallbackEncoder) + config_pkl = os.path.join(self.logdir, "params.pkl") + with open(config_pkl, "wb") as f: + cloudpickle.dump(self.config, f) local_file = os.path.join(self.logdir, "result.json") self.local_out = open(local_file, "w") diff --git a/python/ray/tune/ray_trial_executor.py b/python/ray/tune/ray_trial_executor.py index 86f09cda34d8e..6b107b17c82f9 100644 --- a/python/ray/tune/ray_trial_executor.py +++ b/python/ray/tune/ray_trial_executor.py @@ -29,6 +29,8 @@ def __init__(self, queue_trials=False): self._avail_resources = Resources(cpu=0, gpu=0) self._committed_resources = Resources(cpu=0, gpu=0) self._resources_initialized = False + if ray.is_initialized(): + self._update_avail_resources() def _setup_runner(self, trial): cls = ray.remote( @@ -108,19 +110,27 @@ def _stop_trial(self, trial, error=False, error_msg=None, if stop_logger: trial.close_logger() - def start_trial(self, trial, checkpoint_obj=None): - """Starts the trial.""" + def start_trial(self, trial, checkpoint=None): + """Starts the trial. + + Will not return resources if trial repeatedly fails on start. + + Args: + trial (Trial): Trial to be started. 
+ checkpoint (Checkpoint): A Python object or path storing the state + of trial. + """ self._commit_resources(trial.resources) try: - self._start_trial(trial, checkpoint_obj) + self._start_trial(trial, checkpoint) except Exception: logger.exception("Error stopping runner - retrying...") error_msg = traceback.format_exc() time.sleep(2) self._stop_trial(trial, error=True, error_msg=error_msg) try: - self._start_trial(trial) + self._start_trial(trial, checkpoint) except Exception: logger.exception("Error starting runner, aborting!") error_msg = traceback.format_exc() @@ -138,6 +148,7 @@ def stop_trial(self, trial, error=False, error_msg=None, stop_logger=True): self._stop_trial( trial, error=error, error_msg=error_msg, stop_logger=stop_logger) if prior_status == Trial.RUNNING: + logger.debug("Returning resources for this trial.") self._return_resources(trial.resources) out = self._find_item(self._running, trial) for result_id in out: @@ -213,19 +224,9 @@ def _return_resources(self, resources): assert self._committed_resources.gpu >= 0 def _update_avail_resources(self): - clients = ray.global_state.client_table() - if ray.worker.global_worker.use_raylet: - # TODO(rliaw): Remove once raylet flag is swapped - num_cpus = sum(cl['Resources']['CPU'] for cl in clients) - num_gpus = sum(cl['Resources'].get('GPU', 0) for cl in clients) - else: - local_schedulers = [ - entry for client in clients.values() for entry in client - if (entry['ClientType'] == 'local_scheduler' - and not entry['Deleted']) - ] - num_cpus = sum(ls['CPU'] for ls in local_schedulers) - num_gpus = sum(ls.get('GPU', 0) for ls in local_schedulers) + resources = ray.global_state.cluster_resources() + num_cpus = resources["CPU"] + num_gpus = resources["GPU"] self._avail_resources = Resources(int(num_cpus), int(num_gpus)) self._resources_initialized = True @@ -267,7 +268,16 @@ def debug_string(self): self._committed_resources.cpu, self._avail_resources.cpu, self._committed_resources.gpu, self._avail_resources.gpu) else: - return "" + return "Resources requested: ?" + + def resource_string(self): + """Returns a string describing the total resources available.""" + + if self._resources_initialized: + return "{} CPUs, {} GPUs".format(self._avail_resources.cpu, + self._avail_resources.gpu) + else: + return "? CPUs, ? GPUs" def on_step_begin(self): """Before step() called, update the available resources.""" @@ -277,6 +287,7 @@ def on_step_begin(self): def save(self, trial, storage=Checkpoint.DISK): """Saves the trial's state to a checkpoint.""" trial._checkpoint.storage = storage + trial._checkpoint.last_result = trial.last_result if storage == Checkpoint.MEMORY: trial._checkpoint.value = trial.runner.save_to_object.remote() else: @@ -300,6 +311,8 @@ def restore(self, trial, checkpoint=None): ray.get(trial.runner.restore_from_object.remote(value)) else: ray.get(trial.runner.restore.remote(value)) + trial.last_result = checkpoint.last_result + return True except Exception: logger.exception("Error restoring runner.") diff --git a/python/ray/tune/result.py b/python/ray/tune/result.py index ec307eaed8fb8..0d5aeb0d0618c 100644 --- a/python/ray/tune/result.py +++ b/python/ray/tune/result.py @@ -4,6 +4,8 @@ import os +# yapf: disable +# __sphinx_doc_begin__ # (Optional/Auto-filled) training is terminated. Filled only if not provided. DONE = "done" @@ -16,16 +18,16 @@ # (Auto-filled) The pid of the training process. PID = "pid" -# Number of timesteps in this iteration. +# Number of episodes in this iteration. 
EPISODES_THIS_ITER = "episodes_this_iter" -# (Optional/Auto-filled) Accumulated time in seconds for this experiment. +# (Optional/Auto-filled) Accumulated number of episodes for this experiment. EPISODES_TOTAL = "episodes_total" # Number of timesteps in this iteration. TIMESTEPS_THIS_ITER = "timesteps_this_iter" -# (Optional/Auto-filled) Accumulated time in seconds for this experiment. +# (Auto-filled) Accumulated number of timesteps for this entire experiment. TIMESTEPS_TOTAL = "timesteps_total" # (Auto-filled) Time in seconds this iteration took to run. @@ -35,11 +37,14 @@ # (Auto-filled) Accumulated time in seconds for this entire experiment. TIME_TOTAL_S = "time_total_s" -# (Auto-filled) The index of thistraining iteration. +# (Auto-filled) The index of this training iteration. TRAINING_ITERATION = "training_iteration" +# __sphinx_doc_end__ +# yapf: enable # Where Tune writes result files by default -DEFAULT_RESULTS_DIR = os.path.expanduser("~/ray_results") +DEFAULT_RESULTS_DIR = (os.environ.get("TUNE_RESULT_DIR") + or os.path.expanduser("~/ray_results")) # Meta file about status under each experiment directory, can be # parsed by automlboard if exists. diff --git a/python/ray/tune/schedulers/hyperband.py b/python/ray/tune/schedulers/hyperband.py index 7e2f8f27e278f..71c69b3063a2b 100644 --- a/python/ray/tune/schedulers/hyperband.py +++ b/python/ray/tune/schedulers/hyperband.py @@ -50,7 +50,10 @@ class HyperBandScheduler(FIFOScheduler): For example, to limit trials to 10 minutes and early stop based on the `episode_mean_reward` attr, construct: - ``HyperBand('time_total_s', 'episode_reward_mean', 600)`` + ``HyperBand('time_total_s', 'episode_reward_mean', max_t=600)`` + + Note that Tune's stopping criteria will be applied in conjunction with + HyperBand's early stopping mechanisms. 
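A short, illustrative sketch of that interaction, using the `run_experiments` API seen elsewhere in this change (the trainable and numbers are made up): a trial ends at whichever bound fires first, HyperBand's `max_t` budget or the experiment's own `stop` criterion.

import ray
from ray.tune import run_experiments
from ray.tune.schedulers import HyperBandScheduler


def dummy_trainable(config, reporter):
    # Reports an increasing reward until HyperBand or the stop criterion
    # ends the trial.
    for i in range(10**6):
        reporter(timesteps_total=i, episode_reward_mean=i)


ray.init()
run_experiments(
    {
        "hyperband_sketch": {
            "run": dummy_trainable,
            "num_samples": 8,
            # Applied in conjunction with HyperBand's early stopping.
            "stop": {"training_iteration": 100},
        }
    },
    scheduler=HyperBandScheduler(
        time_attr="time_total_s",
        reward_attr="episode_reward_mean",
        max_t=600))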
See also: https://people.eecs.berkeley.edu/~kjamieson/hyperband.html diff --git a/python/ray/tune/suggest/__init__.py b/python/ray/tune/suggest/__init__.py index f0146ca5e7992..9f4a5e6a7ad06 100644 --- a/python/ray/tune/suggest/__init__.py +++ b/python/ray/tune/suggest/__init__.py @@ -2,9 +2,15 @@ from ray.tune.suggest.basic_variant import BasicVariantGenerator from ray.tune.suggest.suggestion import SuggestionAlgorithm from ray.tune.suggest.hyperopt import HyperOptSearch -from ray.tune.suggest.variant_generator import grid_search, function +from ray.tune.suggest.variant_generator import grid_search, function, \ + sample_from __all__ = [ - "SearchAlgorithm", "BasicVariantGenerator", "HyperOptSearch", - "SuggestionAlgorithm", "grid_search", "function" + "SearchAlgorithm", + "BasicVariantGenerator", + "HyperOptSearch", + "SuggestionAlgorithm", + "grid_search", + "function", + "sample_from", ] diff --git a/python/ray/tune/suggest/hyperopt.py b/python/ray/tune/suggest/hyperopt.py index 45fe9753e0ea0..2c1c1317616d3 100644 --- a/python/ray/tune/suggest/hyperopt.py +++ b/python/ray/tune/suggest/hyperopt.py @@ -4,9 +4,13 @@ import numpy as np import copy +import logging + try: + hyperopt_logger = logging.getLogger("hyperopt") + hyperopt_logger.setLevel(logging.WARNING) import hyperopt as hpo -except Exception as e: +except Exception: hpo = None from ray.tune.error import TuneError @@ -47,7 +51,6 @@ class HyperOptSearch(SuggestionAlgorithm): >>> } >>> algo = HyperOptSearch( >>> space, max_concurrent=4, reward_attr="neg_mean_loss") - >>> algo.add_configurations(config) """ def __init__(self, diff --git a/python/ray/tune/suggest/variant_generator.py b/python/ray/tune/suggest/variant_generator.py index 98b830754093e..d57b586c0e5d2 100644 --- a/python/ray/tune/suggest/variant_generator.py +++ b/python/ray/tune/suggest/variant_generator.py @@ -3,12 +3,15 @@ from __future__ import print_function import copy +import logging import numpy import random import types from ray.tune import TuneError +logger = logging.getLogger(__name__) + def generate_variants(unresolved_spec): """Generates variants from a spec (dict) with unresolved values. @@ -55,8 +58,29 @@ def grid_search(values): return {"grid_search": values} +class sample_from(object): + """Specify that tune should sample configuration values from this function. + + The use of function arguments in tune configs must be disambiguated by + either wrapped the function in tune.eval() or tune.function(). + + Arguments: + func: An callable function to draw a sample from. + """ + + def __init__(self, func): + self.func = func + + class function(object): - """Wraps `func` to make sure it is not expanded during resolution.""" + """Wraps `func` to make sure it is not expanded during resolution. + + The use of function arguments in tune configs must be disambiguated by + either wrapped the function in tune.eval() or tune.function(). + + Arguments: + func: A function literal. + """ def __init__(self, func): self.func = func @@ -155,6 +179,11 @@ def _resolve_lambda_vars(spec, lambda_vars): value = fn(_UnresolvedAccessGuard(spec)) except RecursiveDependencyError as e: error = e + except Exception: + raise ValueError( + "Failed to evaluate expression: {}: {}".format(path, fn) + + ". 
If you meant to pass this as a function literal, use " + "tune.function() to escape it.") else: _assign_value(spec, path, value) resolved[path] = value @@ -198,8 +227,17 @@ def _is_resolved(v): def _try_resolve(v): if isinstance(v, types.FunctionType): - # Lambda function + logger.warn( + "Deprecation warning: Function values are ambiguous in Tune " + "configuations. Either wrap the function with " + "`tune.function(func)` to specify a function literal, or " + "`tune.sample_from(func)` to tell Tune to " + "sample values from the function during variant generation: " + "{}".format(v)) return False, v + elif isinstance(v, sample_from): + # Function to sample from + return False, v.func elif isinstance(v, dict) and len(v) == 1 and "eval" in v: # Lambda function in eval syntax return False, lambda spec: eval( diff --git a/python/ray/tune/test/cluster_tests.py b/python/ray/tune/test/cluster_tests.py new file mode 100644 index 0000000000000..59f12181b8ff9 --- /dev/null +++ b/python/ray/tune/test/cluster_tests.py @@ -0,0 +1,242 @@ +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import json +import pytest +try: + import pytest_timeout +except ImportError: + pytest_timeout = None + +import ray +from ray.rllib import _register_all +from ray.test.cluster_utils import Cluster +from ray.tune.error import TuneError +from ray.tune.trial import Trial +from ray.tune.trial_runner import TrialRunner +from ray.tune.suggest import BasicVariantGenerator + + +def _start_new_cluster(): + cluster = Cluster( + initialize_head=True, + connect=True, + head_node_args={ + "resources": dict(CPU=1), + "_internal_config": json.dumps({ + "num_heartbeats_timeout": 10 + }) + }) + # Pytest doesn't play nicely with imports + _register_all() + return cluster + + +@pytest.fixture +def start_connected_cluster(): + # Start the Ray processes. + cluster = _start_new_cluster() + yield cluster + # The code after the yield will run as teardown code. + ray.shutdown() + cluster.shutdown() + + +@pytest.fixture +def start_connected_emptyhead_cluster(): + """Starts head with no resources.""" + + cluster = Cluster( + initialize_head=True, + connect=True, + head_node_args={ + "resources": dict(CPU=0), + "_internal_config": json.dumps({ + "num_heartbeats_timeout": 10 + }) + }) + # Pytest doesn't play nicely with imports + _register_all() + yield cluster + # The code after the yield will run as teardown code. 
+ ray.shutdown()
+ cluster.shutdown()
+
+
+def test_counting_resources(start_connected_cluster):
+ """Tests that Tune accounting is consistent with actual cluster."""
+
+ cluster = start_connected_cluster
+ nodes = []
+ assert ray.global_state.cluster_resources()["CPU"] == 1
+ runner = TrialRunner(BasicVariantGenerator())
+ kwargs = {"stopping_criterion": {"training_iteration": 10}}
+
+ trials = [Trial("__fake", **kwargs), Trial("__fake", **kwargs)]
+ for t in trials:
+ runner.add_trial(t)
+
+ runner.step() # run 1
+ nodes += [cluster.add_node(resources=dict(CPU=1))]
+ assert cluster.wait_for_nodes()
+ assert ray.global_state.cluster_resources()["CPU"] == 2
+ cluster.remove_node(nodes.pop())
+ assert cluster.wait_for_nodes()
+ assert ray.global_state.cluster_resources()["CPU"] == 1
+ runner.step() # run 2
+ assert sum(t.status == Trial.RUNNING for t in runner.get_trials()) == 1
+
+ for i in range(5):
+ nodes += [cluster.add_node(resources=dict(CPU=1))]
+ assert cluster.wait_for_nodes()
+ assert ray.global_state.cluster_resources()["CPU"] == 6
+
+ runner.step() # 1 result
+ assert sum(t.status == Trial.RUNNING for t in runner.get_trials()) == 2
+
+
+@pytest.mark.skip("Add this test once reconstruction is fixed")
+@pytest.mark.skipif(
+ pytest_timeout is None,
+ reason="Timeout package not installed; skipping test.")
+@pytest.mark.timeout(10, method="thread")
+def test_remove_node_before_result(start_connected_cluster):
+ """Removing a node should cause a Trial to be requeued."""
+ cluster = start_connected_cluster
+ node = cluster.add_node(resources=dict(CPU=1))
+ # TODO(rliaw): Make blocking an option?
+ assert cluster.wait_for_nodes()
+
+ runner = TrialRunner(BasicVariantGenerator())
+ kwargs = {"stopping_criterion": {"training_iteration": 3}}
+ trials = [Trial("__fake", **kwargs), Trial("__fake", **kwargs)]
+ for t in trials:
+ runner.add_trial(t)
+
+ runner.step() # run 1
+ runner.step() # run 2
+ assert all(t.status == Trial.RUNNING for t in trials)
+
+ runner.step() # 1 result
+
+ cluster.remove_node(node)
+ cluster.wait_for_nodes()
+ assert ray.global_state.cluster_resources()["CPU"] == 1
+
+ runner.step() # recover
+ for i in range(5):
+ runner.step()
+ assert all(t.status == Trial.TERMINATED for t in trials)
+
+ with pytest.raises(TuneError):
+ runner.step()
+
+
+@pytest.mark.skipif(
+ pytest_timeout is None,
+ reason="Timeout package not installed; skipping test.")
+@pytest.mark.timeout(120, method="thread")
+def test_trial_migration(start_connected_emptyhead_cluster):
+ """Removing a node while cluster has space should migrate trial.
+
+ The trial state should also be consistent with the checkpoint.
+ """
+ cluster = start_connected_emptyhead_cluster
+ node = cluster.add_node(resources=dict(CPU=1))
+ assert cluster.wait_for_nodes()
+
+ runner = TrialRunner(BasicVariantGenerator())
+ kwargs = {
+ "stopping_criterion": {
+ "training_iteration": 3
+ },
+ "checkpoint_freq": 2,
+ "max_failures": 2
+ }
+
+ # Test recovery of trial that hasn't been checkpointed
+ t = Trial("__fake", **kwargs)
+ runner.add_trial(t)
+ runner.step() # start
+ runner.step() # 1 result
+ assert t.last_result is not None
+ node2 = cluster.add_node(resources=dict(CPU=1))
+ cluster.remove_node(node)
+ assert cluster.wait_for_nodes()
+ runner.step() # Recovery step
+
+ # TODO(rliaw): This assertion is not critical but will not pass
+ # because checkpoint handling is messy and should be refactored
+ # rather than hotfixed.
+ # assert t.last_result is None, "Trial result not restored correctly."
+ for i in range(3): + runner.step() + + assert t.status == Trial.TERMINATED + + # Test recovery of trial that has been checkpointed + t2 = Trial("__fake", **kwargs) + runner.add_trial(t2) + runner.step() # start + runner.step() # 1 result + runner.step() # 2 result and checkpoint + assert t2.has_checkpoint() + node3 = cluster.add_node(resources=dict(CPU=1)) + cluster.remove_node(node2) + assert cluster.wait_for_nodes() + runner.step() # Recovery step + assert t2.last_result["training_iteration"] == 2 + for i in range(1): + runner.step() + + assert t2.status == Trial.TERMINATED + + # Test recovery of trial that won't be checkpointed + t3 = Trial("__fake", **{"stopping_criterion": {"training_iteration": 3}}) + runner.add_trial(t3) + runner.step() # start + runner.step() # 1 result + cluster.add_node(resources=dict(CPU=1)) + cluster.remove_node(node3) + assert cluster.wait_for_nodes() + runner.step() # Error handling step + assert t3.status == Trial.ERROR + + with pytest.raises(TuneError): + runner.step() + + +@pytest.mark.skipif( + pytest_timeout is None, + reason="Timeout package not installed; skipping test.") +@pytest.mark.timeout(120, method="thread") +def test_trial_requeue(start_connected_emptyhead_cluster): + """Removing a node in full cluster causes Trial to be requeued.""" + cluster = start_connected_emptyhead_cluster + node = cluster.add_node(resources=dict(CPU=1)) + assert cluster.wait_for_nodes() + + runner = TrialRunner(BasicVariantGenerator()) + kwargs = { + "stopping_criterion": { + "training_iteration": 5 + }, + "checkpoint_freq": 1, + "max_failures": 1 + } + + trials = [Trial("__fake", **kwargs), Trial("__fake", **kwargs)] + for t in trials: + runner.add_trial(t) + + runner.step() # start + runner.step() # 1 result + + cluster.remove_node(node) + assert cluster.wait_for_nodes() + runner.step() + assert all(t.status == Trial.PENDING for t in trials) + + with pytest.raises(TuneError): + runner.step() diff --git a/python/ray/tune/test/ray_trial_executor_test.py b/python/ray/tune/test/ray_trial_executor_test.py index 35c413e717bb4..86c4bb189595f 100644 --- a/python/ray/tune/test/ray_trial_executor_test.py +++ b/python/ray/tune/test/ray_trial_executor_test.py @@ -9,8 +9,9 @@ from ray.rllib import _register_all from ray.tune import Trainable from ray.tune.ray_trial_executor import RayTrialExecutor +from ray.tune.registry import _global_registry, TRAINABLE_CLASS from ray.tune.suggest import BasicVariantGenerator -from ray.tune.trial import Trial, Checkpoint +from ray.tune.trial import Trial, Checkpoint, Resources class RayTrialExecutorTest(unittest.TestCase): @@ -50,6 +51,12 @@ def testPauseResume(self): self.trial_executor.stop_trial(trial) self.assertEqual(Trial.TERMINATED, trial.status) + def testStartFailure(self): + _global_registry.register(TRAINABLE_CLASS, "asdf", None) + trial = Trial("asdf", resources=Resources(1, 0)) + self.trial_executor.start_trial(trial) + self.assertEqual(Trial.ERROR, trial.status) + def testPauseResume2(self): """Tests that pausing works for trials being processed.""" trial = Trial("__fake") diff --git a/python/ray/tune/test/trial_runner_test.py b/python/ray/tune/test/trial_runner_test.py index 1e4c0509dc151..8e4aa2cea1481 100644 --- a/python/ray/tune/test/trial_runner_test.py +++ b/python/ray/tune/test/trial_runner_test.py @@ -3,6 +3,7 @@ from __future__ import print_function import os +import sys import time import unittest @@ -14,15 +15,22 @@ from ray.tune.ray_trial_executor import RayTrialExecutor from ray.tune.schedulers import TrialScheduler, 
FIFOScheduler from ray.tune.registry import _global_registry, TRAINABLE_CLASS -from ray.tune.result import DEFAULT_RESULTS_DIR, TIMESTEPS_TOTAL, DONE +from ray.tune.result import (DEFAULT_RESULTS_DIR, TIMESTEPS_TOTAL, DONE, + EPISODES_TOTAL) from ray.tune.util import pin_in_object_store, get_pinned_object from ray.tune.experiment import Experiment from ray.tune.trial import Trial, Resources from ray.tune.trial_runner import TrialRunner from ray.tune.suggest import grid_search, BasicVariantGenerator -from ray.tune.suggest.suggestion import _MockSuggestionAlgorithm +from ray.tune.suggest.suggestion import (_MockSuggestionAlgorithm, + SuggestionAlgorithm) from ray.tune.suggest.variant_generator import RecursiveDependencyError +if sys.version_info >= (3, 3): + from unittest.mock import patch +else: + from mock import patch + class TrainableFunctionApiTest(unittest.TestCase): def setUp(self): @@ -106,7 +114,7 @@ def default_resource_request(cls, config): return Resources(cpu=config["cpu"], gpu=config["gpu"]) def _train(self): - return dict(timesteps_this_iter=1, done=True) + return {"timesteps_this_iter": 1, "done": True} register_trainable("B", B) @@ -184,6 +192,21 @@ def train(config, reporter): } }) + def testUploadDirNone(self): + def train(config, reporter): + reporter(timesteps_total=1) + + [trial] = run_experiments({ + "foo": { + "run": train, + "upload_dir": None, + "config": { + "a": "b" + }, + } + }) + self.assertFalse(trial.upload_dir) + def testLogdirStartingWithTilde(self): local_dir = '~/ray_results/local_dir' @@ -418,10 +441,25 @@ def train(config, reporter): }) self.assertIsNone(trial.last_result[TIMESTEPS_TOTAL]) - def train3(config, reporter): + def train2(config, reporter): for i in range(10): reporter(timesteps_total=5) + [trial2] = run_experiments({ + "foo": { + "run": train2, + "config": { + "script_min_iter_time_s": 0, + }, + } + }) + self.assertEqual(trial2.last_result[TIMESTEPS_TOTAL], 5) + self.assertEqual(trial2.last_result["timesteps_this_iter"], 0) + + def train3(config, reporter): + for i in range(10): + reporter(timesteps_this_iter=0, episodes_this_iter=0) + [trial3] = run_experiments({ "foo": { "run": train3, @@ -430,8 +468,73 @@ def train3(config, reporter): }, } }) - self.assertEqual(trial3.last_result[TIMESTEPS_TOTAL], 5) - self.assertEqual(trial3.last_result["timesteps_this_iter"], 0) + self.assertEqual(trial3.last_result[TIMESTEPS_TOTAL], 0) + self.assertEqual(trial3.last_result[EPISODES_TOTAL], 0) + + def testCheckpointDict(self): + class TestTrain(Trainable): + def _setup(self, config): + self.state = {"hi": 1} + + def _train(self): + return {"timesteps_this_iter": 1, "done": True} + + def _save(self, path): + return self.state + + def _restore(self, state): + self.state = state + + test_trainable = TestTrain() + result = test_trainable.save() + test_trainable.state["hi"] = 2 + test_trainable.restore(result) + self.assertEqual(test_trainable.state["hi"], 1) + + trials = run_experiments({ + "foo": { + "run": TestTrain, + "checkpoint_at_end": True + } + }) + for trial in trials: + self.assertEqual(trial.status, Trial.TERMINATED) + self.assertTrue(trial.has_checkpoint()) + + def testMultipleCheckpoints(self): + class TestTrain(Trainable): + def _setup(self, config): + self.state = {"hi": 1, "iter": 0} + + def _train(self): + self.state["iter"] += 1 + return {"timesteps_this_iter": 1, "done": True} + + def _save(self, path): + return self.state + + def _restore(self, state): + self.state = state + + test_trainable = TestTrain() + checkpoint_1 = 
test_trainable.save() + test_trainable.train() + checkpoint_2 = test_trainable.save() + self.assertNotEqual(checkpoint_1, checkpoint_2) + test_trainable.restore(checkpoint_2) + self.assertEqual(test_trainable.state["iter"], 1) + test_trainable.restore(checkpoint_1) + self.assertEqual(test_trainable.state["iter"], 0) + + trials = run_experiments({ + "foo": { + "run": TestTrain, + "checkpoint_at_end": True + } + }) + for trial in trials: + self.assertEqual(trial.status, Trial.TERMINATED) + self.assertTrue(trial.has_checkpoint()) class RunExperimentTest(unittest.TestCase): @@ -538,7 +641,7 @@ def train(config, reporter): class B(Trainable): def _train(self): - return dict(timesteps_this_iter=1, done=True) + return {"timesteps_this_iter": 1, "done": True} register_trainable("f1", train) trials = run_experiments({ @@ -558,10 +661,13 @@ def _train(self): def testCheckpointAtEnd(self): class train(Trainable): def _train(self): - return dict(timesteps_this_iter=1, done=True) + return {"timesteps_this_iter": 1, "done": True} def _save(self, path): - return path + checkpoint = path + "/checkpoint" + with open(checkpoint, "w") as f: + f.write("OK") + return checkpoint trials = run_experiments({ "foo": { @@ -745,6 +851,25 @@ def testMaxConcurrentSuggestions(self): self.assertEqual(len(searcher.next_trials()), 0) +def create_mock_components(): + class _MockScheduler(FIFOScheduler): + errored_trials = [] + + def on_trial_error(self, trial_runner, trial): + self.errored_trials += [trial] + + class _MockSearchAlg(BasicVariantGenerator): + errored_trials = [] + + def on_trial_complete(self, trial_id, error=False, **kwargs): + if error: + self.errored_trials += [trial_id] + + searchalg = _MockSearchAlg() + scheduler = _MockScheduler() + return searchalg, scheduler + + class TrialRunnerTest(unittest.TestCase): def tearDown(self): ray.shutdown() @@ -789,16 +914,6 @@ def train(config, reporter): self.assertLessEqual(len(trial.logdir), 200) trial_executor.stop_trial(trial) - def testTrialErrorOnStart(self): - ray.init() - trial_executor = RayTrialExecutor() - _global_registry.register(TRAINABLE_CLASS, "asdf", None) - trial = Trial("asdf", resources=Resources(1, 0)) - try: - trial_executor.start_trial(trial) - except Exception as e: - self.assertIn("a class", str(e)) - def testExtraResources(self): ray.init(num_cpus=4, num_gpus=2) runner = TrialRunner(BasicVariantGenerator()) @@ -821,7 +936,7 @@ def testExtraResources(self): self.assertEqual(trials[1].status, Trial.PENDING) def testFractionalGpus(self): - ray.init(num_cpus=4, num_gpus=1, use_raylet=True) + ray.init(num_cpus=4, num_gpus=1) runner = TrialRunner(BasicVariantGenerator()) kwargs = { "resources": Resources(cpu=1, gpu=0.5), @@ -901,6 +1016,30 @@ def testMultiStepRun(self): self.assertEqual(trials[0].status, Trial.RUNNING) self.assertEqual(trials[1].status, Trial.RUNNING) + def testMultiStepRun2(self): + """Checks that runner.step throws when overstepping.""" + ray.init(num_cpus=1) + runner = TrialRunner(BasicVariantGenerator()) + kwargs = { + "stopping_criterion": { + "training_iteration": 2 + }, + "resources": Resources(cpu=1, gpu=0), + } + trials = [Trial("__fake", **kwargs)] + for t in trials: + runner.add_trial(t) + + runner.step() + self.assertEqual(trials[0].status, Trial.RUNNING) + + runner.step() + self.assertEqual(trials[0].status, Trial.RUNNING) + + runner.step() + self.assertEqual(trials[0].status, Trial.TERMINATED) + self.assertRaises(TuneError, runner.step) + def testErrorHandling(self): ray.init(num_cpus=4, num_gpus=2) runner = 
TrialRunner(BasicVariantGenerator()) @@ -923,9 +1062,17 @@ def testErrorHandling(self): self.assertEqual(trials[0].status, Trial.ERROR) self.assertEqual(trials[1].status, Trial.RUNNING) - def testFailureRecoveryDisabled(self): + def testThrowOnOverstep(self): ray.init(num_cpus=1, num_gpus=1) runner = TrialRunner(BasicVariantGenerator()) + runner.step() + self.assertRaises(TuneError, runner.step) + + def testFailureRecoveryDisabled(self): + ray.init(num_cpus=1, num_gpus=1) + searchalg, scheduler = create_mock_components() + + runner = TrialRunner(searchalg, scheduler=scheduler) kwargs = { "resources": Resources(cpu=1, gpu=1), "checkpoint_freq": 1, @@ -944,10 +1091,15 @@ def testFailureRecoveryDisabled(self): runner.step() self.assertEqual(trials[0].status, Trial.ERROR) self.assertEqual(trials[0].num_failures, 1) + self.assertEqual(len(searchalg.errored_trials), 1) + self.assertEqual(len(scheduler.errored_trials), 1) def testFailureRecoveryEnabled(self): ray.init(num_cpus=1, num_gpus=1) - runner = TrialRunner(BasicVariantGenerator()) + searchalg, scheduler = create_mock_components() + + runner = TrialRunner(searchalg, scheduler=scheduler) + kwargs = { "resources": Resources(cpu=1, gpu=1), "checkpoint_freq": 1, @@ -968,6 +1120,40 @@ def testFailureRecoveryEnabled(self): self.assertEqual(trials[0].num_failures, 1) runner.step() self.assertEqual(trials[0].status, Trial.RUNNING) + self.assertEqual(len(searchalg.errored_trials), 0) + self.assertEqual(len(scheduler.errored_trials), 0) + + def testFailureRecoveryNodeRemoval(self): + ray.init(num_cpus=1, num_gpus=1) + searchalg, scheduler = create_mock_components() + + runner = TrialRunner(searchalg, scheduler=scheduler) + + kwargs = { + "resources": Resources(cpu=1, gpu=1), + "checkpoint_freq": 1, + "max_failures": 1, + "config": { + "mock_error": True, + }, + } + runner.add_trial(Trial("__fake", **kwargs)) + trials = runner.get_trials() + + with patch('ray.global_state.cluster_resources') as resource_mock: + resource_mock.return_value = {"CPU": 1, "GPU": 1} + runner.step() + self.assertEqual(trials[0].status, Trial.RUNNING) + runner.step() + self.assertEqual(trials[0].status, Trial.RUNNING) + + # Mimic a node failure + resource_mock.return_value = {"CPU": 0, "GPU": 0} + runner.step() + self.assertEqual(trials[0].status, Trial.PENDING) + self.assertEqual(trials[0].num_failures, 1) + self.assertEqual(len(searchalg.errored_trials), 0) + self.assertEqual(len(scheduler.errored_trials), 1) def testFailureRecoveryMaxFailures(self): ray.init(num_cpus=1, num_gpus=1) @@ -1320,6 +1506,55 @@ def testSearchAlgStalled(self): self.assertTrue(searcher.is_finished()) self.assertTrue(runner.is_finished()) + def testSearchAlgFinishes(self): + """Empty SearchAlg changing state in `next_trials` does not crash.""" + + class FinishFastAlg(SuggestionAlgorithm): + _index = 0 + + def next_trials(self): + trials = [] + self._index += 1 + + for trial in self._trial_generator: + trials += [trial] + break + + if self._index > 4: + self._finished = True + return trials + + def _suggest(self, trial_id): + return {} + + ray.init(num_cpus=2) + experiment_spec = { + "run": "__fake", + "num_samples": 2, + "stop": { + "training_iteration": 1 + } + } + searcher = FinishFastAlg() + experiments = [Experiment.from_json("test", experiment_spec)] + searcher.add_configurations(experiments) + + runner = TrialRunner(search_alg=searcher) + self.assertFalse(runner.is_finished()) + runner.step() # This launches a new run + runner.step() # This launches a 2nd run + 
self.assertFalse(searcher.is_finished()) + self.assertFalse(runner.is_finished()) + runner.step() # This kills the first run + self.assertFalse(searcher.is_finished()) + self.assertFalse(runner.is_finished()) + runner.step() # This kills the 2nd run + self.assertFalse(searcher.is_finished()) + self.assertFalse(runner.is_finished()) + runner.step() # this converts self._finished to True + self.assertTrue(searcher.is_finished()) + self.assertRaises(TuneError, runner.step) + if __name__ == "__main__": unittest.main(verbosity=2) diff --git a/python/ray/tune/trainable.py b/python/ray/tune/trainable.py index 1e537d26d953d..5824c5221ff5b 100644 --- a/python/ray/tune/trainable.py +++ b/python/ray/tune/trainable.py @@ -4,6 +4,7 @@ from datetime import datetime +import copy import gzip import io import logging @@ -83,7 +84,7 @@ def __init__(self, config=None, logger_creator=None): self._timesteps_since_restore = 0 self._iterations_since_restore = 0 self._restored = False - self._setup() + self._setup(copy.deepcopy(self.config)) self._local_ip = ray.services.get_node_ip_address() @classmethod @@ -143,6 +144,8 @@ def train(self): start = time.time() result = self._train() + assert isinstance(result, dict), "_train() needs to return a dict." + result = result.copy() self._iteration += 1 @@ -158,14 +161,14 @@ def train(self): result.setdefault(DONE, False) # self._timesteps_total should only be tracked if increments provided - if result.get(TIMESTEPS_THIS_ITER): + if result.get(TIMESTEPS_THIS_ITER) is not None: if self._timesteps_total is None: self._timesteps_total = 0 self._timesteps_total += result[TIMESTEPS_THIS_ITER] self._timesteps_since_restore += result[TIMESTEPS_THIS_ITER] - # self._timesteps_total should only be tracked if increments provided - if result.get(EPISODES_THIS_ITER): + # self._episodes_total should only be tracked if increments provided + if result.get(EPISODES_THIS_ITER) is not None: if self._episodes_total is None: self._episodes_total = 0 self._episodes_total += result[EPISODES_THIS_ITER] @@ -211,11 +214,38 @@ def save(self, checkpoint_dir=None): Checkpoint path that may be passed to restore(). 
""" - checkpoint_path = self._save(checkpoint_dir or self.logdir) - pickle.dump([ - self._experiment_id, self._iteration, self._timesteps_total, - self._time_total, self._episodes_total - ], open(checkpoint_path + ".tune_metadata", "wb")) + checkpoint_dir = os.path.join(checkpoint_dir or self.logdir, + "checkpoint_{}".format(self._iteration)) + os.makedirs(checkpoint_dir) + checkpoint = self._save(checkpoint_dir) + saved_as_dict = False + if isinstance(checkpoint, str): + if (not checkpoint.startswith(checkpoint_dir) + or checkpoint == checkpoint_dir): + raise ValueError( + "The returned checkpoint path must be within the " + "given checkpoint dir {}: {}".format( + checkpoint_dir, checkpoint)) + if not os.path.exists(checkpoint): + raise ValueError( + "The returned checkpoint path does not exist: {}".format( + checkpoint)) + checkpoint_path = checkpoint + elif isinstance(checkpoint, dict): + saved_as_dict = True + checkpoint_path = os.path.join(checkpoint_dir, "checkpoint") + with open(checkpoint_path, "wb") as f: + pickle.dump(checkpoint, f) + else: + raise ValueError("Return value from `_save` must be dict or str.") + pickle.dump({ + "experiment_id": self._experiment_id, + "iteration": self._iteration, + "timesteps_total": self._timesteps_total, + "time_total": self._time_total, + "episodes_total": self._episodes_total, + "saved_as_dict": saved_as_dict + }, open(checkpoint_path + ".tune_metadata", "wb")) return checkpoint_path def save_to_object(self): @@ -259,13 +289,19 @@ def restore(self, checkpoint_path): This method restores additional metadata saved with the checkpoint. """ - self._restore(checkpoint_path) metadata = pickle.load(open(checkpoint_path + ".tune_metadata", "rb")) - self._experiment_id = metadata[0] - self._iteration = metadata[1] - self._timesteps_total = metadata[2] - self._time_total = metadata[3] - self._episodes_total = metadata[4] + self._experiment_id = metadata["experiment_id"] + self._iteration = metadata["iteration"] + self._timesteps_total = metadata["timesteps_total"] + self._time_total = metadata["time_total"] + self._episodes_total = metadata["episodes_total"] + saved_as_dict = metadata["saved_as_dict"] + if saved_as_dict: + with open(checkpoint_path, "rb") as loaded_state: + checkpoint_dict = pickle.load(loaded_state) + self._restore(checkpoint_dict) + else: + self._restore(checkpoint_path) self._restored = True def restore_from_object(self, obj): @@ -318,30 +354,39 @@ def _save(self, checkpoint_dir): Args: checkpoint_dir (str): The directory where the checkpoint - can be stored. + file must be stored. Returns: - Checkpoint path that may be passed to restore(). Typically - would default to `checkpoint_dir`. + checkpoint (str | dict): If string, the return value is + expected to be the checkpoint path that will be passed to + `_restore()`. If dict, the return value will be automatically + serialized by Tune and passed to `_restore()`. + + Examples: + >>> print(trainable1._save("/tmp/checkpoint_1")) + "/tmp/checkpoint_1/my_checkpoint_file" + >>> print(trainable2._save("/tmp/checkpoint_2")) + {"some": "data"} """ raise NotImplementedError - def _restore(self, checkpoint_path): + def _restore(self, checkpoint): """Subclasses should override this to implement restore(). Args: - checkpoint_path (str): The directory where the checkpoint - is stored. + checkpoint (str | dict): Value as returned by `_save`. + If a string, then it is the checkpoint path. 
""" raise NotImplementedError - def _setup(self): + def _setup(self, config): """Subclasses should override this for custom initialization. - Subclasses can access the hyperparameter configuration via - ``self.config``. + Args: + config (dict): Hyperparameters and other configs given. + Copy of `self.config`. """ pass diff --git a/python/ray/tune/trial.py b/python/ray/tune/trial.py index 98fcbc6d55e60..f60fd25f2dbac 100644 --- a/python/ray/tune/trial.py +++ b/python/ray/tune/trial.py @@ -8,6 +8,7 @@ import time import tempfile import os +from numbers import Number import ray from ray.tune import TuneError @@ -33,12 +34,14 @@ class Resources( namedtuple("Resources", ["cpu", "gpu", "extra_cpu", "extra_gpu"])): """Ray resources required to schedule a trial. + TODO: Custom resources. + Attributes: - cpu (int): Number of CPUs to allocate to the trial. - gpu (int): Number of GPUs to allocate to the trial. - extra_cpu (int): Extra CPUs to reserve in case the trial needs to + cpu (float): Number of CPUs to allocate to the trial. + gpu (float): Number of GPUs to allocate to the trial. + extra_cpu (float): Extra CPUs to reserve in case the trial needs to launch additional Ray actors that use CPUs. - extra_gpu (int): Extra GPUs to reserve in case the trial needs to + extra_gpu (float): Extra GPUs to reserve in case the trial needs to launch additional Ray actors that use GPUs. """ @@ -46,6 +49,9 @@ class Resources( __slots__ = () def __new__(cls, cpu, gpu, extra_cpu=0, extra_gpu=0): + for entry in [cpu, gpu, extra_cpu, extra_gpu]: + assert isinstance(entry, Number), "Improper resource value." + assert entry >= 0, "Resource cannot be negative." return super(Resources, cls).__new__(cls, cpu, gpu, extra_cpu, extra_gpu) @@ -79,9 +85,10 @@ class Checkpoint(object): MEMORY = "memory" DISK = "disk" - def __init__(self, storage, value): + def __init__(self, storage, value, last_result=None): self.storage = storage self.value = value + self.last_result = last_result @staticmethod def from_object(value=None): @@ -209,17 +216,19 @@ def should_stop(self, result): return False - def should_checkpoint(self, result): + def should_checkpoint(self): """Whether this trial is due for checkpointing.""" + result = self.last_result or {} if result.get(DONE) and self.checkpoint_at_end: return True - if not self.checkpoint_freq: + if self.checkpoint_freq: + return result.get(TRAINING_ITERATION, + 0) % self.checkpoint_freq == 0 + else: return False - return self.last_result[TRAINING_ITERATION] % self.checkpoint_freq == 0 - def progress_string(self): """Returns a progress message for printing out to the console.""" @@ -271,6 +280,16 @@ def _status_string(self): def has_checkpoint(self): return self._checkpoint.value is not None + def should_recover(self): + """Returns whether the trial qualifies for restoring. + + This is if a checkpoint frequency is set and has not failed more than + max_failures. This may return true even when there may not yet + be a checkpoint. 
+ """ + return (self.checkpoint_freq > 0 + and self.num_failures < self.max_failures) + def update_last_result(self, result, terminate=False): if terminate: result.update(done=True) @@ -299,8 +318,10 @@ def __repr__(self): def __str__(self): """Combines ``env`` with ``trainable_name`` and ``experiment_tag``.""" if "env" in self.config: - identifier = "{}_{}".format(self.trainable_name, - self.config["env"]) + env = self.config["env"] + if isinstance(env, type): + env = env.__name__ + identifier = "{}_{}".format(self.trainable_name, env) else: identifier = self.trainable_name if self.experiment_tag: diff --git a/python/ray/tune/trial_executor.py b/python/ray/tune/trial_executor.py index b961d12b8cbe4..063129780b47a 100644 --- a/python/ray/tune/trial_executor.py +++ b/python/ray/tune/trial_executor.py @@ -4,7 +4,6 @@ from __future__ import print_function import logging -import traceback from ray.tune.trial import Trial, Checkpoint @@ -33,12 +32,10 @@ def has_resources(self, resources): "has_resources() method") def start_trial(self, trial, checkpoint=None): - """Starts the trial restoring from checkpoint if checkpoint != None. - - If an error is encountered when starting the trial, an exception will - be thrown. + """Starts the trial restoring from checkpoint if checkpoint is provided. Args: + trial (Trial): Trial to be started. checkpoint(Checkpoint): A Python object or path storing the state of trial. """ @@ -60,26 +57,6 @@ def stop_trial(self, trial, error=False, error_msg=None, stop_logger=True): raise NotImplementedError("Subclasses of TrialExecutor must provide " "stop_trial() method") - def restart_trial(self, trial, error_msg=None): - """Restarts the trial. - - The state of the trial should restore from the last checkpoint. - - Args: - error_msg (str): Optional error message. - """ - try: - logger.info( - "Attempting to recover trial state from last checkpoint") - self.stop_trial( - trial, error=True, error_msg=error_msg, stop_logger=False) - trial.result_logger.flush() - self.start_trial(trial) - except Exception: - error_msg = traceback.format_exc() - logger.exception("Error recovering trial from checkpoint, abort.") - self.stop_trial(trial, error=True, error_msg=error_msg) - def continue_training(self, trial): """Continues the training of this trial.""" pass @@ -158,7 +135,11 @@ def fetch_result(self, trial): def debug_string(self): """Returns a human readable message for printing to the console.""" - pass + raise NotImplementedError + + def resource_string(self): + """Returns a string describing the total resources available.""" + raise NotImplementedError def restore(self, trial, checkpoint=None): """Restores training state from a checkpoint. diff --git a/python/ray/tune/trial_runner.py b/python/ray/tune/trial_runner.py index 6423d6a95f10e..84457ff8d9e95 100644 --- a/python/ray/tune/trial_runner.py +++ b/python/ray/tune/trial_runner.py @@ -12,7 +12,7 @@ from ray.tune import TuneError from ray.tune.ray_trial_executor import RayTrialExecutor from ray.tune.result import TIME_THIS_ITER_S -from ray.tune.trial import Trial +from ray.tune.trial import Trial, Checkpoint from ray.tune.schedulers import FIFOScheduler, TrialScheduler from ray.tune.web_server import TuneServer @@ -108,6 +108,8 @@ def step(self): Callers should typically run this method repeatedly in a loop. They may inspect or modify the runner's state in between calls to step(). 
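# --- Illustrative sketch (editor's example, not part of this diff). step()
# now raises TuneError once everything has finished (see the guard added at
# the top of step() below), so a driver loop should poll is_finished()
# between calls. Assumes `searcher` is a configured SearchAlgorithm, as in
# the test above.
from ray.tune.trial_runner import TrialRunner

runner = TrialRunner(search_alg=searcher)
while not runner.is_finished():
    runner.step()
# A further runner.step() here would raise TuneError.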
""" + if self.is_finished(): + raise TuneError("Called step when all trials finished?") self.trial_executor.on_step_begin() next_trial = self._get_next_trial() if next_trial is not None: @@ -120,20 +122,19 @@ def step(self): if not self.has_resources(trial.resources): raise TuneError( ("Insufficient cluster resources to launch trial: " - "trial requested {} but the cluster summary: {} " + "trial requested {} but the cluster has only {}. " "Pass `queue_trials=True` in " "ray.tune.run_experiments() or on the command " "line to queue trials until the cluster scales " "up. {}").format( trial.resources.summary_string(), - self.trial_executor.debug_string(), + self.trial_executor.resource_string(), trial._get_trainable_cls().resource_help( trial.config))) elif trial.status == Trial.PAUSED: raise TuneError( "There are paused trials, but no more pending " "trials with sufficient resources.") - raise TuneError("Called step when all trials finished?") if self._server: self._process_requests() @@ -215,8 +216,29 @@ def _debug_messages(self): messages = ["== Status =="] messages.append(self._scheduler_alg.debug_string()) messages.append(self.trial_executor.debug_string()) + messages.append(self._memory_debug_string()) return messages + def _memory_debug_string(self): + try: + import psutil + total_gb = psutil.virtual_memory().total / 1e9 + used_gb = total_gb - psutil.virtual_memory().available / 1e9 + if used_gb > total_gb * 0.9: + warn = (": ***LOW MEMORY*** less than 10% of the memory on " + "this node is available for use. This can cause " + "unexpected crashes. Consider " + "reducing the memory used by your application " + "or reducing the Ray object store size by setting " + "`object_store_memory` when calling `ray.init`.") + else: + warn = "" + return "Memory usage on this node: {}/{} GB{}".format( + round(used_gb, 1), round(total_gb, 1), warn) + except ImportError: + return ("Unknown memory usage. 
Please run `pip install psutil` " + "(or ray[debug]) to resolve)") + def has_resources(self, resources): """Returns whether this runner has at least the specified resources.""" return self.trial_executor.has_resources(resources) @@ -257,17 +279,14 @@ def _process_events(self): result, terminate=(decision == TrialScheduler.STOP)) if decision == TrialScheduler.CONTINUE: - if trial.should_checkpoint(result): - # TODO(rliaw): This is a blocking call - self.trial_executor.save(trial) + self._checkpoint_if_needed(trial) self.trial_executor.continue_training(trial) elif decision == TrialScheduler.PAUSE: self.trial_executor.pause_trial(trial) elif decision == TrialScheduler.STOP: # Checkpoint before ending the trial # if checkpoint_at_end experiment option is set to True - if trial.should_checkpoint(result): - self.trial_executor.save(trial) + self._checkpoint_if_needed(trial) self.trial_executor.stop_trial(trial) else: assert False, "Invalid scheduling decision: {}".format( @@ -276,24 +295,61 @@ def _process_events(self): logger.exception("Error processing event.") error_msg = traceback.format_exc() if trial.status == Trial.RUNNING: - if trial.has_checkpoint() and \ - trial.num_failures < trial.max_failures: + if trial.should_recover(): self._try_recover(trial, error_msg) else: self._scheduler_alg.on_trial_error(self, trial) self._search_alg.on_trial_complete( trial.trial_id, error=True) - self.trial_executor.stop_trial(trial, True, error_msg) + self.trial_executor.stop_trial( + trial, error=True, error_msg=error_msg) + + def _checkpoint_if_needed(self, trial): + """Checkpoints trial based off trial.last_result.""" + if trial.should_checkpoint(): + # Save trial runtime if possible + if hasattr(trial, "runner") and trial.runner: + self.trial_executor.save(trial, storage=Checkpoint.DISK) def _try_recover(self, trial, error_msg): + """Tries to recover trial. + + Notifies SearchAlgorithm and Scheduler if failure to recover. + + Args: + trial (Trial): Trial to recover. + error_msg (str): Error message from prior to invoking this method. + """ try: - logger.info("Attempting to recover" - " trial state from last checkpoint.") - self.trial_executor.restart_trial(trial, error_msg) + self.trial_executor.stop_trial( + trial, + error=error_msg is not None, + error_msg=error_msg, + stop_logger=False) + trial.result_logger.flush() + if self.trial_executor.has_resources(trial.resources): + logger.info("Attempting to recover" + " trial state from last checkpoint.") + self.trial_executor.start_trial(trial) + if trial.status == Trial.ERROR: + raise RuntimeError("Trial did not start correctly.") + else: + logger.debug("Notifying Scheduler and requeueing trial.") + self._requeue_trial(trial) except Exception: - error_msg = traceback.format_exc() - logger.warning("Error recovering trial from checkpoint, abort.") - self.trial_executor.stop_trial(trial, True, error_msg=error_msg) + logger.exception("Error recovering trial from checkpoint, abort.") + self._scheduler_alg.on_trial_error(self, trial) + self._search_alg.on_trial_complete(trial.trial_id, error=True) + + def _requeue_trial(self, trial): + """Notification to TrialScheduler and requeue trial. + + This does not notify the SearchAlgorithm because + the function evaluation is still in progress. + """ + self._scheduler_alg.on_trial_error(self, trial) + trial.status = Trial.PENDING + self._scheduler_alg.on_trial_add(self, trial) def _update_trial_queue(self, blocking=False, timeout=600): """Adds next trials to queue if possible. 
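# --- Illustrative sketch (editor's example, not part of this diff). The
# memory warning assembled in _memory_debug_string above is driven by psutil;
# the same figures can be reproduced standalone, assuming `pip install psutil`.
import psutil

vm = psutil.virtual_memory()
total_gb = vm.total / 1e9
used_gb = total_gb - vm.available / 1e9
print("Memory usage on this node: {}/{} GB".format(
    round(used_gb, 1), round(total_gb, 1)))
if used_gb > total_gb * 0.9:
    print("***LOW MEMORY*** less than 10% of this node's memory is free.")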
@@ -302,13 +358,15 @@ def _update_trial_queue(self, blocking=False, timeout=600): Args: blocking (bool): Blocks until either a trial is available - or the Runner finishes (i.e., timeout or search algorithm - finishes). + or is_finished (timeout or search algorithm finishes). timeout (int): Seconds before blocking times out. """ trials = self._search_alg.next_trials() if blocking and not trials: start = time.time() + # Checking `is_finished` instead of _search_alg.is_finished + # is fine because blocking only occurs if all trials are + # finished and search_algorithm is not yet finished while (not trials and not self.is_finished() and time.time() - start < timeout): logger.info("Blocking for next trial...") diff --git a/python/ray/tune/util.py b/python/ray/tune/util.py index 691d25adbe97e..9c047fd80043e 100644 --- a/python/ray/tune/util.py +++ b/python/ray/tune/util.py @@ -28,7 +28,7 @@ def pin_in_object_store(obj): def get_pinned_object(pinned_id): """Retrieve a pinned object from the object store.""" - from ray.local_scheduler import ObjectID + from ray.raylet import ObjectID return _from_pinnable( ray.get( diff --git a/python/ray/utils.py b/python/ray/utils.py index 0f6adaea98683..e75e006721444 100644 --- a/python/ray/utils.py +++ b/python/ray/utils.py @@ -5,6 +5,7 @@ import binascii import functools import hashlib +import inspect import numpy as np import os import subprocess @@ -14,11 +15,9 @@ import uuid import ray.gcs_utils -import ray.local_scheduler +import ray.raylet import ray.ray_constants as ray_constants -ERROR_KEY_PREFIX = b"Error:" - def _random_string(): id_hash = hashlib.sha1() @@ -69,22 +68,12 @@ def push_error_to_driver(worker, """ if driver_id is None: driver_id = ray_constants.NIL_JOB_ID.id() - error_key = ERROR_KEY_PREFIX + driver_id + b":" + _random_string() data = {} if data is None else data - if not worker.use_raylet: - worker.redis_client.hmset(error_key, { - "type": error_type, - "message": message, - "data": data - }) - worker.redis_client.rpush("ErrorKeys", error_key) - else: - worker.local_scheduler_client.push_error( - ray.ObjectID(driver_id), error_type, message, time.time()) + worker.local_scheduler_client.push_error( + ray.ObjectID(driver_id), error_type, message, time.time()) def push_error_to_driver_through_redis(redis_client, - use_raylet, error_type, message, driver_id=None, @@ -98,8 +87,6 @@ def push_error_to_driver_through_redis(redis_client, Args: redis_client: The redis client to use. - use_raylet: True if we are using the Raylet code path and false - otherwise. error_type (str): The type of the error. message (str): The message that will be printed in the background on the driver. @@ -110,23 +97,14 @@ def push_error_to_driver_through_redis(redis_client, """ if driver_id is None: driver_id = ray_constants.NIL_JOB_ID.id() - error_key = ERROR_KEY_PREFIX + driver_id + b":" + _random_string() data = {} if data is None else data - if not use_raylet: - redis_client.hmset(error_key, { - "type": error_type, - "message": message, - "data": data - }) - redis_client.rpush("ErrorKeys", error_key) - else: - # Do everything in Python and through the Python Redis client instead - # of through the raylet. - error_data = ray.gcs_utils.construct_error_message( - driver_id, error_type, message, time.time()) - redis_client.execute_command( - "RAY.TABLE_APPEND", ray.gcs_utils.TablePrefix.ERROR_INFO, - ray.gcs_utils.TablePubsub.ERROR_INFO, driver_id, error_data) + # Do everything in Python and through the Python Redis client instead + # of through the raylet. 
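# --- Illustrative round trip (editor's example, not part of this diff).
# get_pinned_object above now resolves ObjectID via ray.raylet; its usual
# pairing with pin_in_object_store is otherwise unchanged. Requires a running
# Ray instance.
import ray
from ray.tune.util import pin_in_object_store, get_pinned_object

ray.init()
pinned_id = pin_in_object_store({"weights": [1, 2, 3]})
assert get_pinned_object(pinned_id) == {"weights": [1, 2, 3]}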
+ error_data = ray.gcs_utils.construct_error_message(driver_id, error_type, + message, time.time()) + redis_client.execute_command( + "RAY.TABLE_APPEND", ray.gcs_utils.TablePrefix.ERROR_INFO, + ray.gcs_utils.TablePubsub.ERROR_INFO, driver_id, error_data) def is_cython(obj): @@ -144,6 +122,23 @@ def check_cython(x): (hasattr(obj, "__func__") and check_cython(obj.__func__)) +def is_function_or_method(obj): + """Check if an object is a function or method. + + Args: + obj: The Python object in question. + + Returns: + True if the object is an function or method. + """ + return (inspect.isfunction(obj) or inspect.ismethod(obj) or is_cython(obj)) + + +def is_class_method(f): + """Returns whether the given method is a class_method.""" + return hasattr(f, "__self__") and f.__self__ is not None + + def random_string(): """Generate a random string to use as an ID. @@ -329,6 +324,28 @@ def get_system_memory(): return sysctl(["sysctl", "hw.memsize"]) +def get_shared_memory_bytes(): + """Get the size of the shared memory file system. + + Returns: + The size of the shared memory file system in bytes. + """ + # Make sure this is only called on Linux. + assert sys.platform == "linux" or sys.platform == "linux2" + + shm_fd = os.open("/dev/shm", os.O_RDONLY) + try: + shm_fs_stats = os.fstatvfs(shm_fd) + # The value shm_fs_stats.f_bsize is the block size and the + # value shm_fs_stats.f_bavail is the number of available + # blocks. + shm_avail = shm_fs_stats.f_bsize * shm_fs_stats.f_bavail + finally: + os.close(shm_fd) + + return shm_avail + + def check_oversized_pickle(pickled, name, obj_type, worker): """Send a warning message if the pickled object is too large. @@ -406,3 +423,7 @@ def thread_safe_client(client, lock=None): if lock is None: lock = threading.Lock() return _ThreadSafeProxy(client, lock) + + +def is_main_thread(): + return threading.current_thread().getName() == "MainThread" diff --git a/python/ray/worker.py b/python/ray/worker.py index 2d1d45f65b1c3..de2513780ad5a 100644 --- a/python/ray/worker.py +++ b/python/ray/worker.py @@ -2,9 +2,10 @@ from __future__ import division from __future__ import print_function +from contextlib import contextmanager import atexit -import collections import colorama +import faulthandler import hashlib import inspect import logging @@ -23,17 +24,19 @@ import ray.cloudpickle as pickle import ray.experimental.state as state import ray.gcs_utils +import ray.memory_monitor as memory_monitor import ray.remote_function import ray.serialization as serialization import ray.services as services import ray.signature -import ray.local_scheduler +import ray.tempfile_services as tempfile_services +import ray.raylet import ray.plasma import ray.ray_constants as ray_constants from ray import import_thread from ray import profiling +from ray.function_manager import FunctionActorManager from ray.utils import ( - binary_to_hex, check_oversized_pickle, is_cython, random_string, @@ -55,14 +58,6 @@ NIL_ACTOR_HANDLE_ID = NIL_ID NIL_CLIENT_ID = ray_constants.ID_SIZE * b"\xff" -# This must be kept in sync with the `error_types` array in -# common/state/error_table.h. -OBJECT_HASH_MISMATCH_ERROR_TYPE = b"object_hash_mismatch" -PUT_RECONSTRUCTION_ERROR_TYPE = b"put_reconstruction" - -# This must be kept in sync with the `scheduling_state` enum in common/task.h. -TASK_STATUS_RUNNING = 8 - # Default resource requirements for actors when no resource requirements are # specified. 
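# --- Illustrative usage (editor's example, not part of this diff). The new
# get_shared_memory_bytes helper above asserts it is running on Linux, so
# callers should guard on the platform themselves.
import sys
import ray.utils

if sys.platform.startswith("linux"):
    shm_bytes = ray.utils.get_shared_memory_bytes()
    print("/dev/shm has {:.1f} GB available".format(shm_bytes / 1e9))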
DEFAULT_ACTOR_METHOD_CPUS_SIMPLE_CASE = 1 @@ -77,6 +72,11 @@ # using logging.basicConfig in its entry/init points. logger = logging.getLogger(__name__) +try: + import setproctitle +except ImportError: + setproctitle = None + class RayTaskError(Exception): """An object used internally to represent a task that threw an exception. @@ -175,11 +175,6 @@ def __str__(self): self.task_error)) -FunctionExecutionInfo = collections.namedtuple( - "FunctionExecutionInfo", ["function", "function_name", "max_calls"]) -"""FunctionExecutionInfo: A named tuple storing remote function information.""" - - class Worker(object): """A class used to define the control flow of a worker process. @@ -188,19 +183,9 @@ class Worker(object): functions outside of this class are considered exposed. Attributes: - function_execution_info (Dict[str, FunctionExecutionInfo]): A - dictionary mapping the name of a remote function to the remote - function itself. This is the set of remote functions that can be - executed by this worker. connected (bool): True if Ray has been started and False otherwise. mode: The mode of the worker. One of SCRIPT_MODE, LOCAL_MODE, and WORKER_MODE. - cached_remote_functions_and_actors: A list of information for exporting - remote functions and actor classes definitions that were defined - before the worker called connect. When the worker eventually does - call connect, if it is a driver, it will export these functions and - actors. If cached_remote_functions_and_actors is None, that means - that connect has been called already. cached_functions_to_run (List): A list of functions to run on all of the workers that should be exported as soon as connect is called. profiler: the profiler used to aggregate profiling information. @@ -215,24 +200,9 @@ class Worker(object): def __init__(self): """Initialize a Worker object.""" - # This field is a dictionary that maps a driver ID to a dictionary of - # functions (and information about those functions) that have been - # registered for that driver (this inner dictionary maps function IDs - # to a FunctionExecutionInfo object. This should only be used on - # workers that execute remote functions. - self.function_execution_info = collections.defaultdict(lambda: {}) - # This is a dictionary mapping driver ID to a dictionary that maps - # remote function IDs for that driver to a counter of the number of - # times that remote function has been executed on this worker. The - # counter is incremented every time the function is executed on this - # worker. When the counter reaches the maximum number of executions - # allowed for a particular function, the worker is killed. - self.num_task_executions = collections.defaultdict(lambda: {}) self.connected = False self.mode = None - self.cached_remote_functions_and_actors = [] self.cached_functions_to_run = [] - self.fetch_and_register_actor = None self.actor_init_error = None self.make_actor = None self.actors = {} @@ -247,13 +217,44 @@ def __init__(self): # When the worker is constructed. Record the original value of the # CUDA_VISIBLE_DEVICES environment variable. self.original_gpu_ids = ray.utils.get_cuda_visible_devices() - self.profiler = profiling.Profiler(self) + self.profiler = None + self.memory_monitor = memory_monitor.MemoryMonitor() self.state_lock = threading.Lock() # A dictionary that maps from driver id to SerializationContext # TODO: clean up the SerializationContext once the job finished. 
self.serialization_context_map = {} + self.function_actor_manager = FunctionActorManager(self) + # Reads/writes to the following fields must be protected by + # self.state_lock. # Identity of the driver that this worker is processing. - self.task_driver_id = None + self.task_driver_id = ray.ObjectID(NIL_ID) + self.current_task_id = ray.ObjectID(NIL_ID) + self.task_index = 0 + self.put_index = 1 + + def get_current_thread_task_id(self): + """Get the current thread's task ID. + + This returns the assigned task ID if called on the main thread, else a + random task ID. This method is not thread-safe and must be called with + self.state_lock acquired. + """ + current_task_id = self.current_task_id + if not ray.utils.is_main_thread(): + # If this is running on a separate thread, then the mapping + # to the current task ID may not be correct. Generate a + # random task ID so that the backend can differentiate + # between different threads. + current_task_id = ray.ObjectID(random_string()) + if not self.multithreading_warned: + logger.warning( + "Calling ray.get or ray.wait in a separate thread " + "may lead to deadlock if the main thread blocks on this " + "thread and there are not enough resources to execute " + "more tasks") + self.multithreading_warned = True + assert not current_task_id.is_nil() + return current_task_id def mark_actor_init_failed(self, error): """Called to mark this actor as failed during initialization.""" @@ -349,7 +350,7 @@ def store_and_register(self, object_id, value, depth=100): "of their fields. This behavior may " "be incorrect in some cases.".format( type(e.example_object))) - logger.warning(warning_message) + logger.debug(warning_message) except (serialization.RayNotDictionarySerializable, serialization.CloudPickleError, pickle.pickle.PicklingError, Exception): @@ -413,6 +414,17 @@ def put_object(self, object_id, value): logger.info( "The object with ID {} already exists in the object store." .format(object_id)) + except TypeError: + # This error can happen because one of the members of the object + # may not be serializable for cloudpickle. So we need these extra + # fallbacks here to start from the beginning. Hopefully the object + # could have a `__reduce__` method. + register_custom_serializer(type(value), use_pickle=True) + warning_message = ("WARNING: Serializing the class {} failed, " + "so are are falling back to cloudpickle." + .format(type(value))) + logger.warning(warning_message) + self.store_and_register(object_id, value) def retrieve_and_deserialize(self, object_ids, timeout, error_timeout=10): start_time = time.time() @@ -439,7 +451,8 @@ def retrieve_and_deserialize(self, object_ids, timeout, error_timeout=10): invalid_error = RayTaskError( "", None, "Invalid return value: likely worker died or was killed " - "while executing the task.") + "while executing the task; check previous logs or dmesg " + "for errors.") return [invalid_error] * len(object_ids) except pyarrow.DeserializationCallbackError: # Wait a little bit for the import thread to import the class. 
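# --- Illustrative sketch (editor's example, not part of this diff). The
# TypeError fallback added to put_object above does automatically what a user
# can also request up front via ray.register_custom_serializer (as used
# internally above). `OpaqueHandle` is a made-up class standing in for a type
# the default serializer cannot handle.
import ray

class OpaqueHandle(object):
    def __init__(self, value):
        self.value = value

ray.init()
# Force pickle-based serialization, mirroring the fallback in put_object.
ray.register_custom_serializer(OpaqueHandle, use_pickle=True)
oid = ray.put(OpaqueHandle(42))
assert ray.get(oid).value == 42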
@@ -489,13 +502,9 @@ def get_object(self, object_ids): ] for i in range(0, len(object_ids), ray._config.worker_fetch_request_size()): - if not self.use_raylet: - self.plasma_client.fetch(plain_object_ids[i:( - i + ray._config.worker_fetch_request_size())]) - else: - self.local_scheduler_client.reconstruct_objects( - object_ids[i:( - i + ray._config.worker_fetch_request_size())], True) + self.local_scheduler_client.fetch_or_reconstruct( + object_ids[i:(i + ray._config.worker_fetch_request_size())], + True) # Get the objects. We initially try to get the objects immediately. final_results = self.retrieve_and_deserialize(plain_object_ids, 0) @@ -509,6 +518,9 @@ def get_object(self, object_ids): if len(unready_ids) > 0: with self.state_lock: + # Get the task ID, to notify the backend which task is blocked. + current_task_id = self.get_current_thread_task_id() + # Try reconstructing any objects we haven't gotten yet. Try to # get them until at least get_timeout_milliseconds # milliseconds passes, then repeat. @@ -525,25 +537,10 @@ def get_object(self, object_ids): ray._config.worker_fetch_request_size()) for i in range(0, len(object_ids_to_fetch), fetch_request_size): - if not self.use_raylet: - for unready_id in ray_object_ids_to_fetch[i:( - i + fetch_request_size)]: - (self.local_scheduler_client. - reconstruct_objects([unready_id], False)) - # Do another fetch for objects that aren't - # available locally yet, in case they were evicted - # since the last fetch. We divide the fetch into - # smaller fetches so as to not block the manager - # for a prolonged period of time in a single call. - # This is only necessary for legacy ray since - # reconstruction and fetch are implemented by - # different processes. - self.plasma_client.fetch(object_ids_to_fetch[i:( - i + fetch_request_size)]) - else: - self.local_scheduler_client.reconstruct_objects( - ray_object_ids_to_fetch[i:( - i + fetch_request_size)], False) + self.local_scheduler_client.fetch_or_reconstruct( + ray_object_ids_to_fetch[i:( + i + fetch_request_size)], False, + current_task_id) results = self.retrieve_and_deserialize( object_ids_to_fetch, max([ @@ -561,7 +558,7 @@ def get_object(self, object_ids): # If there were objects that we weren't able to get locally, # let the local scheduler know that we're now unblocked. - self.local_scheduler_client.notify_unblocked() + self.local_scheduler_client.notify_unblocked(current_task_id) assert len(final_results) == len(object_ids) return final_results @@ -578,6 +575,7 @@ def submit_task(self, execution_dependencies=None, num_return_vals=None, resources=None, + placement_resources=None, driver_id=None): """Submit a remote task to the scheduler. @@ -603,6 +601,9 @@ def submit_task(self, num_return_vals: The number of return values this function should have. resources: The resource requirements for this task. + placement_resources: The resources required for placing the task. + If this is not provided or if it is an empty dictionary, then + the placement resources will be equal to resources. driver_id: The ID of the relevant driver. This is almost always the driver ID of the driver that is currently running. 
However, in the exceptional case that an actor task is being dispatched to @@ -632,7 +633,7 @@ def submit_task(self, for arg in args: if isinstance(arg, ray.ObjectID): args_for_local_scheduler.append(arg) - elif ray.local_scheduler.check_simple_value(arg): + elif ray.raylet.check_simple_value(arg): args_for_local_scheduler.append(arg) else: args_for_local_scheduler.append(put(arg)) @@ -656,74 +657,28 @@ def submit_task(self, raise ValueError( "Resource quantities must all be whole numbers.") + if placement_resources is None: + placement_resources = {} + with self.state_lock: # Increment the worker's task index to track how many tasks # have been submitted by the current task so far. task_index = self.task_index self.task_index += 1 + # The parent task must be set for the submitted task. + assert not self.current_task_id.is_nil() # Submit the task to local scheduler. - task = ray.local_scheduler.Task( + task = ray.raylet.Task( driver_id, ray.ObjectID( function_id.id()), args_for_local_scheduler, num_return_vals, self.current_task_id, task_index, actor_creation_id, actor_creation_dummy_object_id, actor_id, - actor_handle_id, actor_counter, is_actor_checkpoint_method, - execution_dependencies, resources, self.use_raylet) + actor_handle_id, actor_counter, execution_dependencies, + resources, placement_resources) self.local_scheduler_client.submit(task) return task.returns() - def export_remote_function(self, function_id, function_name, function, - max_calls, decorated_function): - """Export a remote function. - - Args: - function_id: The ID of the function. - function_name: The name of the function. - function: The raw undecorated function to export. - max_calls: The maximum number of times a given worker can execute - this function before exiting. - decorated_function: The decorated function (this is used to enable - the remote function to recursively call itself). - """ - if self.mode != SCRIPT_MODE: - raise Exception("export_remote_function can only be called on a " - "driver.") - - key = (b"RemoteFunction:" + self.task_driver_id.id() + b":" + - function_id.id()) - - # Work around limitations of Python pickling. - function_name_global_valid = function.__name__ in function.__globals__ - function_name_global_value = function.__globals__.get( - function.__name__) - # Allow the function to reference itself as a global variable - if not is_cython(function): - function.__globals__[function.__name__] = decorated_function - try: - pickled_function = pickle.dumps(function) - finally: - # Undo our changes - if function_name_global_valid: - function.__globals__[function.__name__] = ( - function_name_global_value) - else: - del function.__globals__[function.__name__] - - check_oversized_pickle(pickled_function, function_name, - "remote function", self) - - self.redis_client.hmset( - key, { - "driver_id": self.task_driver_id.id(), - "function_id": function_id.id(), - "name": function_name, - "module": function.__module__, - "function": pickled_function, - "max_calls": max_calls - }) - self.redis_client.rpush("Exports", key) - def run_function_on_all_workers(self, function, run_on_other_drivers=False): """Run arbitrary code on all of the workers. 
@@ -773,7 +728,7 @@ def run_function_on_all_workers(self, function, "driver_id": self.task_driver_id.id(), "function_id": function_to_run_id, "function": pickled_function, - "run_on_other_drivers": run_on_other_drivers + "run_on_other_drivers": str(run_on_other_drivers) }) self.redis_client.rpush("Exports", key) # TODO(rkn): If the worker fails after it calls setnx and before it @@ -782,47 +737,6 @@ def run_function_on_all_workers(self, function, # operations into a transaction (or by implementing a custom # command that does all three things). - def _wait_for_function(self, function_id, driver_id, timeout=10): - """Wait until the function to be executed is present on this worker. - - This method will simply loop until the import thread has imported the - relevant function. If we spend too long in this loop, that may indicate - a problem somewhere and we will push an error message to the user. - - If this worker is an actor, then this will wait until the actor has - been defined. - - Args: - function_id (str): The ID of the function that we want to execute. - driver_id (str): The ID of the driver to push the error message to - if this times out. - """ - start_time = time.time() - # Only send the warning once. - warning_sent = False - while True: - with self.lock: - if (self.actor_id == NIL_ACTOR_ID - and (function_id.id() in - self.function_execution_info[driver_id])): - break - elif self.actor_id != NIL_ACTOR_ID and ( - self.actor_id in self.actors): - break - if time.time() - start_time > timeout: - warning_message = ("This worker was asked to execute a " - "function that it does not have " - "registered. You may have to restart " - "Ray.") - if not warning_sent: - ray.utils.push_error_to_driver( - self, - ray_constants.WAIT_FOR_FUNCTION_PUSH_ERROR, - warning_message, - driver_id=driver_id) - warning_sent = True - time.sleep(0.001) - def _get_arguments_for_execution(self, function_name, serialized_args): """Retrieve the arguments for the remote function. @@ -863,7 +777,7 @@ def _get_arguments_for_execution(self, function_name, serialized_args): arguments.append(argument) return arguments - def _store_outputs_in_objstore(self, object_ids, outputs): + def _store_outputs_in_object_store(self, object_ids, outputs): """Store the outputs of a remote function in the local object store. This stores the values that were returned by a remote function in the @@ -890,7 +804,7 @@ def _store_outputs_in_objstore(self, object_ids, outputs): self.put_object(object_ids[i], outputs[i]) - def _process_task(self, task): + def _process_task(self, task, function_execution_info): """Execute a task assigned to this worker. This method deserializes a task from the scheduler, and attempts to @@ -900,37 +814,41 @@ def _process_task(self, task): (these will be retrieved by calls to get or by subsequent tasks that use the outputs of this task). """ - # The ID of the driver that this task belongs to. This is needed so - # that if the task throws an exception, we propagate the error - # message to the correct driver. - self.task_driver_id = task.driver_id() - self.current_task_id = task.task_id() - self.task_index = 0 - self.put_index = 1 + with self.state_lock: + assert self.task_driver_id.is_nil() + assert self.current_task_id.is_nil() + assert self.task_index == 0 + assert self.put_index == 1 + + # The ID of the driver that this task belongs to. This is needed so + # that if the task throws an exception, we propagate the error + # message to the correct driver. 
+ self.task_driver_id = task.driver_id() + self.current_task_id = task.task_id() + function_id = task.function_id() args = task.arguments() return_object_ids = task.returns() if task.actor_id().id() != NIL_ACTOR_ID: dummy_return_id = return_object_ids.pop() - function_executor = self.function_execution_info[ - self.task_driver_id.id()][function_id.id()].function - function_name = self.function_execution_info[self.task_driver_id.id()][ - function_id.id()].function_name + function_executor = function_execution_info.function + function_name = function_execution_info.function_name # Get task arguments from the object store. try: if function_name != "__ray_terminate__": self.reraise_actor_init_error() + self.memory_monitor.raise_if_low_memory() with profiling.profile("task:deserialize_arguments", worker=self): arguments = self._get_arguments_for_execution( function_name, args) except (RayGetError, RayGetArgumentError) as e: - self._handle_process_task_failure(function_id, return_object_ids, - e, None) + self._handle_process_task_failure(function_id, function_name, + return_object_ids, e, None) return except Exception as e: self._handle_process_task_failure( - function_id, return_object_ids, e, + function_id, function_name, return_object_ids, e, ray.utils.format_error_message(traceback.format_exc())) return @@ -949,8 +867,9 @@ def _process_task(self, task): task_exception = task.actor_id().id() == NIL_ACTOR_ID traceback_str = ray.utils.format_error_message( traceback.format_exc(), task_exception=task_exception) - self._handle_process_task_failure(function_id, return_object_ids, - e, traceback_str) + self._handle_process_task_failure(function_id, function_name, + return_object_ids, e, + traceback_str) return # Store the outputs in the local object store. @@ -962,21 +881,19 @@ def _process_task(self, task): num_returns = len(return_object_ids) if num_returns == 1: outputs = (outputs, ) - self._store_outputs_in_objstore(return_object_ids, outputs) + self._store_outputs_in_object_store(return_object_ids, outputs) except Exception as e: self._handle_process_task_failure( - function_id, return_object_ids, e, + function_id, function_name, return_object_ids, e, ray.utils.format_error_message(traceback.format_exc())) - def _handle_process_task_failure(self, function_id, return_object_ids, - error, backtrace): - function_name = self.function_execution_info[self.task_driver_id.id()][ - function_id.id()].function_name + def _handle_process_task_failure(self, function_id, function_name, + return_object_ids, error, backtrace): failure_object = RayTaskError(function_name, error, backtrace) failure_objects = [ failure_object for _ in range(len(return_object_ids)) ] - self._store_outputs_in_objstore(return_object_ids, failure_objects) + self._store_outputs_in_object_store(return_object_ids, failure_objects) # Log the error message. ray.utils.push_error_to_driver( self, @@ -1013,7 +930,7 @@ def _become_actor(self, task): time.sleep(0.001) with self.lock: - self.fetch_and_register_actor(key, self) + self.function_actor_manager.fetch_and_register_actor(key) def _wait_for_and_process_task(self, task): """Wait for a task to be ready and process the task. @@ -1030,11 +947,8 @@ def _wait_for_and_process_task(self, task): self._become_actor(task) return - # Wait until the function to be executed has actually been registered - # on this worker. We will push warnings to the user if we spend too - # long in this loop. 
- with profiling.profile("wait_for_function", worker=self): - self._wait_for_function(function_id, driver_id) + execution_info = self.function_actor_manager.get_execution_info( + driver_id, function_id) # Execute the task. # TODO(rkn): Consider acquiring this lock with a timeout and pushing a @@ -1042,38 +956,38 @@ def _wait_for_and_process_task(self, task): # because that may indicate that the system is hanging, and it'd be # good to know where the system is hanging. with self.lock: - - function_name = (self.function_execution_info[driver_id][ - function_id.id()]).function_name - if not self.use_raylet: - extra_data = { - "function_name": function_name, - "task_id": task.task_id().hex(), - "worker_id": binary_to_hex(self.worker_id) - } + function_name = execution_info.function_name + extra_data = { + "name": function_name, + "task_id": task.task_id().hex() + } + if task.actor_id().id() == NIL_ACTOR_ID: + title = "ray_worker:{}()".format(function_name) + next_title = "ray_worker" else: - extra_data = { - "name": function_name, - "task_id": task.task_id().hex() - } + actor = self.actors[task.actor_id().id()] + title = "ray_{}:{}()".format(actor.__class__.__name__, + function_name) + next_title = "ray_{}".format(actor.__class__.__name__) with profiling.profile("task", extra_data=extra_data, worker=self): - self._process_task(task) - - # In the non-raylet code path, push all of the log events to the global - # state store. In the raylet code path, this is done periodically in a - # background thread. - if not self.use_raylet: - self.profiler.flush_profile_data() + with _changeproctitle(title, next_title): + self._process_task(task, execution_info) + # Reset the state fields so the next task can run. + with self.state_lock: + self.task_driver_id = ray.ObjectID(NIL_ID) + self.current_task_id = ray.ObjectID(NIL_ID) + self.task_index = 0 + self.put_index = 1 # Increase the task execution counter. - self.num_task_executions[driver_id][function_id.id()] += 1 + self.function_actor_manager.increase_task_counter( + driver_id, function_id.id()) - reached_max_executions = ( - self.num_task_executions[driver_id][function_id.id()] == self. - function_execution_info[driver_id][function_id.id()].max_calls) + reached_max_executions = (self.function_actor_manager.get_task_counter( + driver_id, function_id.id()) == execution_info.max_calls) if reached_max_executions: self.local_scheduler_client.disconnect() - os._exit(0) + sys.exit(0) def _get_next_task_from_local_scheduler(self): """Get the next task from the local scheduler. @@ -1081,7 +995,7 @@ def _get_next_task_from_local_scheduler(self): Returns: A task from the local scheduler. """ - with profiling.profile("get_task", worker=self): + with profiling.profile("worker_idle", worker=self): task = self.local_scheduler_client.get_task() # Automatically restrict the GPUs available to this task. 
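# --- Hypothetical reconstruction (editor's sketch, not part of this diff).
# The _changeproctitle helper used above is defined elsewhere in worker.py and
# is not shown in this hunk; a version consistent with its usage and with the
# optional setproctitle import added earlier might look like this.
from contextlib import contextmanager

try:
    import setproctitle
except ImportError:
    setproctitle = None

@contextmanager
def _changeproctitle(title, next_title):
    # Label the process while the task runs, then switch to the idle title.
    if setproctitle:
        setproctitle.setproctitle(title)
    yield
    if setproctitle:
        setproctitle.setproctitle(next_title)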
@@ -1118,13 +1032,10 @@ def get_gpu_ids(): raise Exception("ray.get_gpu_ids() currently does not work in PYTHON " "MODE.") - if not global_worker.use_raylet: - assigned_ids = global_worker.local_scheduler_client.gpu_ids() - else: - all_resource_ids = global_worker.local_scheduler_client.resource_ids() - assigned_ids = [ - resource_id for resource_id, _ in all_resource_ids.get("GPU", []) - ] + all_resource_ids = global_worker.local_scheduler_client.resource_ids() + assigned_ids = [ + resource_id for resource_id, _ in all_resource_ids.get("GPU", []) + ] # If the user had already set CUDA_VISIBLE_DEVICES, then respect that (in # the sense that only GPU IDs that appear in CUDA_VISIBLE_DEVICES should be # returned). @@ -1139,17 +1050,11 @@ def get_gpu_ids(): def get_resource_ids(): """Get the IDs of the resources that are available to the worker. - This function is only supported in the raylet code path. - Returns: A dictionary mapping the name of a resource to a list of pairs, where each pair consists of the ID of a resource and the fraction of that resource reserved for this worker. """ - if not global_worker.use_raylet: - raise Exception("ray.get_resource_ids() is only supported in the " - "raylet code path.") - if _mode() == LOCAL_MODE: raise Exception( "ray.get_resource_ids() currently does not work in PYTHON " @@ -1232,22 +1137,8 @@ def error_applies_to_driver(error_key, worker=global_worker): def error_info(worker=global_worker): """Return information about failed tasks.""" worker.check_connected() - if worker.use_raylet: - return (global_state.error_messages(job_id=worker.task_driver_id) + - global_state.error_messages(job_id=ray_constants.NIL_JOB_ID)) - error_keys = worker.redis_client.lrange("ErrorKeys", 0, -1) - errors = [] - for error_key in error_keys: - if error_applies_to_driver(error_key, worker=worker): - error_contents = worker.redis_client.hgetall(error_key) - error_contents = { - "type": ray.utils.decode(error_contents[b"type"]), - "message": ray.utils.decode(error_contents[b"message"]), - "data": ray.utils.decode(error_contents[b"data"]) - } - errors.append(error_contents) - - return errors + return (global_state.error_messages(job_id=worker.task_driver_id) + + global_state.error_messages(job_id=ray_constants.NIL_JOB_ID)) def _initialize_serialization(driver_id, worker=global_worker): @@ -1343,121 +1234,57 @@ def actor_handle_deserializer(serialized_obj): def get_address_info_from_redis_helper(redis_address, node_ip_address, - use_raylet=False): + redis_password=None): redis_ip_address, redis_port = redis_address.split(":") # For this command to work, some other client (on the same machine as # Redis) must have run "CONFIG SET protected-mode no". redis_client = redis.StrictRedis( - host=redis_ip_address, port=int(redis_port)) - - if not use_raylet: - # The client table prefix must be kept in sync with the file - # "src/common/redis_module/ray_redis_module.cc" where it is defined. - client_keys = redis_client.keys("{}*".format( - ray.gcs_utils.DB_CLIENT_PREFIX)) - # Filter to live clients on the same node and do some basic checking. - plasma_managers = [] - local_schedulers = [] - for key in client_keys: - info = redis_client.hgetall(key) - - # Ignore clients that were deleted. 
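# --- Illustrative usage (editor's example, not part of this diff). From user
# code, ray.get_gpu_ids() is called the same way as before; only the
# raylet-backed lookup above changed. Assumes GPUs are available.
import os
import ray

ray.init(num_gpus=2)

@ray.remote(num_gpus=1)
def which_gpu():
    # CUDA_VISIBLE_DEVICES has already been restricted for this task.
    return ray.get_gpu_ids(), os.environ.get("CUDA_VISIBLE_DEVICES")

print(ray.get(which_gpu.remote()))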
- deleted = info[b"deleted"] - deleted = bool(int(deleted)) - if deleted: - continue - - assert b"ray_client_id" in info - assert b"node_ip_address" in info - assert b"client_type" in info - client_node_ip_address = ray.utils.decode(info[b"node_ip_address"]) - if (client_node_ip_address == node_ip_address or - (client_node_ip_address == "127.0.0.1" - and redis_ip_address == ray.services.get_node_ip_address())): - if ray.utils.decode(info[b"client_type"]) == "plasma_manager": - plasma_managers.append(info) - elif (ray.utils.decode( - info[b"client_type"]) == "local_scheduler"): - local_schedulers.append(info) - # Make sure that we got at least one plasma manager and local - # scheduler. - assert len(plasma_managers) >= 1 - assert len(local_schedulers) >= 1 - # Build the address information. - object_store_addresses = [] - for manager in plasma_managers: - address = ray.utils.decode(manager[b"manager_address"]) - port = services.get_port(address) - object_store_addresses.append( - services.ObjectStoreAddress( - name=ray.utils.decode(manager[b"store_socket_name"]), - manager_name=ray.utils.decode( - manager[b"manager_socket_name"]), - manager_port=port)) - scheduler_names = [ - ray.utils.decode(scheduler[b"local_scheduler_socket_name"]) - for scheduler in local_schedulers - ] - client_info = { - "node_ip_address": node_ip_address, - "redis_address": redis_address, - "object_store_addresses": object_store_addresses, - "local_scheduler_socket_names": scheduler_names, - # Web UI should be running. - "webui_url": _webui_url_helper(redis_client) - } - return client_info - - # Handle the raylet case. - else: - # In the raylet code path, all client data is stored in a zset at the - # key for the nil client. - client_key = b"CLIENT" + NIL_CLIENT_ID - clients = redis_client.zrange(client_key, 0, -1) - raylets = [] - for client_message in clients: - client = ray.gcs_utils.ClientTableData.GetRootAsClientTableData( - client_message, 0) - client_node_ip_address = ray.utils.decode( - client.NodeManagerAddress()) - if (client_node_ip_address == node_ip_address or - (client_node_ip_address == "127.0.0.1" - and redis_ip_address == ray.services.get_node_ip_address())): - raylets.append(client) - # Make sure that at least one raylet has started locally. - # This handles a race condition where Redis has started but - # the raylet has not connected. - if len(raylets) == 0: - raise Exception( - "Redis has started but no raylets have registered yet.") - object_store_addresses = [ - services.ObjectStoreAddress( - name=ray.utils.decode(raylet.ObjectStoreSocketName()), - manager_name=None, - manager_port=None) for raylet in raylets - ] - raylet_socket_names = [ - ray.utils.decode(raylet.RayletSocketName()) for raylet in raylets - ] - return { - "node_ip_address": node_ip_address, - "redis_address": redis_address, - "object_store_addresses": object_store_addresses, - "raylet_socket_names": raylet_socket_names, - # Web UI should be running. - "webui_url": _webui_url_helper(redis_client) - } + host=redis_ip_address, port=int(redis_port), password=redis_password) + + # In the raylet code path, all client data is stored in a zset at the + # key for the nil client. 
+ client_key = b"CLIENT" + NIL_CLIENT_ID + clients = redis_client.zrange(client_key, 0, -1) + raylets = [] + for client_message in clients: + client = ray.gcs_utils.ClientTableData.GetRootAsClientTableData( + client_message, 0) + client_node_ip_address = ray.utils.decode(client.NodeManagerAddress()) + if (client_node_ip_address == node_ip_address or + (client_node_ip_address == "127.0.0.1" + and redis_ip_address == ray.services.get_node_ip_address())): + raylets.append(client) + # Make sure that at least one raylet has started locally. + # This handles a race condition where Redis has started but + # the raylet has not connected. + if len(raylets) == 0: + raise Exception( + "Redis has started but no raylets have registered yet.") + object_store_addresses = [ + ray.utils.decode(raylet.ObjectStoreSocketName()) for raylet in raylets + ] + raylet_socket_names = [ + ray.utils.decode(raylet.RayletSocketName()) for raylet in raylets + ] + return { + "node_ip_address": node_ip_address, + "redis_address": redis_address, + "object_store_addresses": object_store_addresses, + "raylet_socket_names": raylet_socket_names, + # Web UI should be running. + "webui_url": _webui_url_helper(redis_client) + } def get_address_info_from_redis(redis_address, node_ip_address, num_retries=5, - use_raylet=False): + redis_password=None): counter = 0 while True: try: return get_address_info_from_redis_helper( - redis_address, node_ip_address, use_raylet=use_raylet) + redis_address, node_ip_address, redis_password=redis_password) except Exception: if counter == num_retries: raise @@ -1515,6 +1342,8 @@ def _init(address_info=None, num_workers=None, num_local_schedulers=None, object_store_memory=None, + redis_max_memory=None, + collect_profiling_data=True, local_mode=False, driver_mode=None, redirect_worker_output=False, @@ -1525,10 +1354,15 @@ def _init(address_info=None, resources=None, num_redis_shards=None, redis_max_clients=None, + redis_password=None, plasma_directory=None, huge_pages=False, include_webui=True, - use_raylet=None): + driver_id=None, + plasma_store_socket_name=None, + raylet_socket_name=None, + temp_dir=None, + _internal_config=None): """Helper method to connect to an existing Ray cluster or start a new one. This method handles two cases. Either a Ray cluster already exists and we @@ -1550,12 +1384,15 @@ def _init(address_info=None, object IDs. The same value can be used across multiple runs of the same job in order to generate the object IDs in a consistent manner. However, the same ID should not be used for different jobs. - num_workers (int): The number of workers to start. This is only - provided if start_ray_local is True. num_local_schedulers (int): The number of local schedulers to start. This is only provided if start_ray_local is True. object_store_memory: The maximum amount of memory (in bytes) to allow the object store to use. + redis_max_memory: The max amount of memory (in bytes) to allow redis + to use, or None for no limit. Once the limit is exceeded, redis + will start LRU eviction of entries. This only applies to the + sharded redis tables (task and object tables). + collect_profiling_data: Whether to collect profiling data from workers. local_mode (bool): True if the code should be executed serially without Ray. This is useful for debugging. redirect_worker_output: True if the stdout and stderr of worker @@ -1577,13 +1414,23 @@ def _init(address_info=None, the primary Redis shard. redis_max_clients: If provided, attempt to configure Redis with this maxclients number. 
+ redis_password (str): Prevents external clients without the password + from connecting to Redis if provided. plasma_directory: A directory where the Plasma memory mapped files will be created. huge_pages: Boolean flag indicating whether to start the Object Store with hugetlbfs support. Requires plasma_directory. include_webui: Boolean flag indicating whether to start the web UI, which is a Jupyter notebook. - use_raylet: True if the new raylet code path should be used. + driver_id: The ID of driver. + plasma_store_socket_name (str): If provided, it will specify the socket + name used by the plasma store. + raylet_socket_name (str): If provided, it will specify the socket path + used by the raylet process. + temp_dir (str): If provided, it will specify the root temporary + directory for the Ray process. + _internal_config (str): JSON configuration for overriding + RayConfig defaults. For testing purposes ONLY. Returns: Address information about the started processes. @@ -1600,10 +1447,10 @@ def _init(address_info=None, else: driver_mode = SCRIPT_MODE - if use_raylet is None and os.environ.get("RAY_USE_XRAY") == "1": - # This environment variable is used in our testing setup. - logger.info("Detected environment variable 'RAY_USE_XRAY'.") - use_raylet = True + if redis_max_memory and collect_profiling_data: + logger.warn("Profiling data cannot be LRU evicted, so it is disabled " + "when redis_max_memory is set.") + collect_profiling_data = False # Get addresses of existing services. if address_info is None: @@ -1626,12 +1473,8 @@ def _init(address_info=None, # Use 1 local scheduler if num_local_schedulers is not provided. If # existing local schedulers are provided, use that count as # num_local_schedulers. - local_schedulers = address_info.get("local_scheduler_socket_names", []) if num_local_schedulers is None: - if len(local_schedulers) > 0: - num_local_schedulers = len(local_schedulers) - else: - num_local_schedulers = 1 + num_local_schedulers = 1 # Use 1 additional redis shard if num_redis_shards is not provided. 
num_redis_shards = 1 if num_redis_shards is None else num_redis_shards @@ -1648,6 +1491,8 @@ def _init(address_info=None, num_workers=num_workers, num_local_schedulers=num_local_schedulers, object_store_memory=object_store_memory, + redis_max_memory=redis_max_memory, + collect_profiling_data=collect_profiling_data, redirect_worker_output=redirect_worker_output, redirect_output=redirect_output, start_workers_from_local_scheduler=( @@ -1655,10 +1500,14 @@ def _init(address_info=None, resources=resources, num_redis_shards=num_redis_shards, redis_max_clients=redis_max_clients, + redis_password=redis_password, plasma_directory=plasma_directory, huge_pages=huge_pages, include_webui=include_webui, - use_raylet=use_raylet) + plasma_store_socket_name=plasma_store_socket_name, + raylet_socket_name=raylet_socket_name, + temp_dir=temp_dir, + _internal_config=_internal_config) else: if redis_address is None: raise Exception("When connecting to an existing cluster, " @@ -1684,18 +1533,34 @@ def _init(address_info=None, if object_store_memory is not None: raise Exception("When connecting to an existing cluster, " "object_store_memory must not be provided.") + if redis_max_memory is not None: + raise Exception("When connecting to an existing cluster, " + "redis_max_memory must not be provided.") if plasma_directory is not None: raise Exception("When connecting to an existing cluster, " "plasma_directory must not be provided.") if huge_pages: raise Exception("When connecting to an existing cluster, " "huge_pages must not be provided.") + if temp_dir is not None: + raise Exception("When connecting to an existing cluster, " + "temp_dir must not be provided.") + if plasma_store_socket_name is not None: + raise Exception("When connecting to an existing cluster, " + "plasma_store_socket_name must not be provided.") + if raylet_socket_name is not None: + raise Exception("When connecting to an existing cluster, " + "raylet_socket_name must not be provided.") + if _internal_config is not None: + raise Exception("When connecting to an existing cluster, " + "_internal_config must not be provided.") + # Get the node IP address if one is not provided. if node_ip_address is None: node_ip_address = services.get_node_ip_address(redis_address) # Get the address info of the processes to connect to from Redis. address_info = get_address_info_from_redis( - redis_address, node_ip_address, use_raylet=use_raylet) + redis_address, node_ip_address, redis_password=redis_password) # Connect this driver to Redis, the object store, and the local scheduler. # Choose the first object store and local scheduler if there are multiple. @@ -1707,24 +1572,22 @@ def _init(address_info=None, driver_address_info = { "node_ip_address": node_ip_address, "redis_address": address_info["redis_address"], - "store_socket_name": ( - address_info["object_store_addresses"][0].name), - "webui_url": address_info["webui_url"] + "store_socket_name": address_info["object_store_addresses"][0], + "webui_url": address_info["webui_url"], } - if not use_raylet: - driver_address_info["manager_socket_name"] = ( - address_info["object_store_addresses"][0].manager_name) - driver_address_info["local_scheduler_socket_name"] = ( - address_info["local_scheduler_socket_names"][0]) - else: - driver_address_info["raylet_socket_name"] = ( - address_info["raylet_socket_names"][0]) + driver_address_info["raylet_socket_name"] = ( + address_info["raylet_socket_names"][0]) + + # We only pass `temp_dir` to a worker (WORKER_MODE). + # It can't be a worker here. 
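
The chain of checks above enforces that cluster-wide options are only accepted when Ray is started locally; when attaching to an existing cluster, only connection-level arguments are allowed. A hedged sketch of the two call patterns (all values and addresses are placeholders):

import ray

# Case 1: start a new single-node cluster. Cluster-wide options are accepted
# because the processes are being launched right here.
ray.init(object_store_memory=10**9,       # illustrative 1 GB store
         temp_dir="/tmp/ray_example")     # illustrative temp root
ray.shutdown()

# Case 2: attach to an already running cluster (address is a placeholder).
# Only connection-level arguments may be passed; adding e.g. temp_dir raises
# "When connecting to an existing cluster, temp_dir must not be provided."
# ray.init(redis_address="192.168.0.10:6379", redis_password=None)
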
connect( driver_address_info, object_id_seed=object_id_seed, mode=driver_mode, worker=global_worker, - use_raylet=use_raylet) + driver_id=driver_id, + redis_password=redis_password, + collect_profiling_data=collect_profiling_data) return address_info @@ -1733,6 +1596,8 @@ def init(redis_address=None, num_gpus=None, resources=None, object_store_memory=None, + redis_max_memory=None, + collect_profiling_data=True, node_ip_address=None, object_id_seed=None, num_workers=None, @@ -1743,14 +1608,19 @@ def init(redis_address=None, ignore_reinit_error=False, num_redis_shards=None, redis_max_clients=None, - redis_protected_mode=True, + redis_password=None, plasma_directory=None, huge_pages=False, include_webui=True, - use_raylet=None, + driver_id=None, configure_logging=True, logging_level=logging.INFO, - logging_format=ray_constants.LOGGER_FORMAT): + logging_format=ray_constants.LOGGER_FORMAT, + plasma_store_socket_name=None, + raylet_socket_name=None, + temp_dir=None, + _internal_config=None, + use_raylet=None): """Connect to an existing Ray cluster or start one and connect to it. This method handles two cases. Either a Ray cluster already exists and we @@ -1784,13 +1654,16 @@ def init(redis_address=None, of that resource available. object_store_memory: The amount of memory (in bytes) to start the object store with. + redis_max_memory: The max amount of memory (in bytes) to allow redis + to use, or None for no limit. Once the limit is exceeded, redis + will start LRU eviction of entries. This only applies to the + sharded redis tables (task and object tables). + collect_profiling_data: Whether to collect profiling data from workers. node_ip_address (str): The IP address of the node that we are on. object_id_seed (int): Used to seed the deterministic generation of object IDs. The same value can be used across multiple runs of the same job in order to generate the object IDs in a consistent manner. However, the same ID should not be used for different jobs. - num_workers (int): The number of workers to start. This is only - provided if redis_address is not provided. local_mode (bool): True if the code should be executed serially without Ray. This is useful for debugging. redirect_worker_output: True if the stdout and stderr of worker @@ -1803,18 +1676,28 @@ def init(redis_address=None, the primary Redis shard. redis_max_clients: If provided, attempt to configure Redis with this maxclients number. + redis_password (str): Prevents external clients without the password + from connecting to Redis if provided. plasma_directory: A directory where the Plasma memory mapped files will be created. huge_pages: Boolean flag indicating whether to start the Object Store with hugetlbfs support. Requires plasma_directory. include_webui: Boolean flag indicating whether to start the web UI, which is a Jupyter notebook. - use_raylet: True if the new raylet code path should be used. + driver_id: The ID of driver. configure_logging: True if allow the logging cofiguration here. Otherwise, the users may want to configure it by their own. - logging_level: Logging level, default will be loging.INFO. + logging_level: Logging level, default will be logging.INFO. logging_format: Logging format, default will be "%(message)s" which means only contains the message. + plasma_store_socket_name (str): If provided, it will specify the socket + name used by the plasma store. + raylet_socket_name (str): If provided, it will specify the socket path + used by the raylet process. 
+ temp_dir (str): If provided, it will specify the root temporary + directory for the Ray process. + _internal_config (str): JSON configuration for overriding + RayConfig defaults. For testing purposes ONLY. Returns: Address information about the started processes. @@ -1823,9 +1706,25 @@ def init(redis_address=None, Exception: An exception is raised if an inappropriate combination of arguments is passed in. """ + if configure_logging: logging.basicConfig(level=logging_level, format=logging_format) + # Add the use_raylet option for backwards compatibility. + if use_raylet is not None: + if use_raylet: + logger.warn("WARNING: The use_raylet argument has been " + "deprecated. Please remove it.") + else: + raise DeprecationWarning("The use_raylet argument is deprecated. " + "Please remove it.") + + if setproctitle is None: + logger.warning( + "WARNING: Not updating worker name since `setproctitle` is not " + "installed. Install this with `pip install setproctitle` " + "(or ray[debug]) to enable monitoring of worker processes.") + if global_worker.connected: if ignore_reinit_error: logger.error("Calling ray.init() again after it has already been " @@ -1834,11 +1733,6 @@ def init(redis_address=None, else: raise Exception("Perhaps you called ray.init twice by accident?") - if use_raylet is None and os.environ.get("RAY_USE_XRAY") == "1": - # This environment variable is used in our testing setup. - logger.info("Detected environment variable 'RAY_USE_XRAY'.") - use_raylet = True - # Convert hostnames to numerical IP address. if node_ip_address is not None: node_ip_address = services.address_to_ip(node_ip_address) @@ -1850,6 +1744,7 @@ def init(redis_address=None, address_info=info, start_ray_local=(redis_address is None), num_workers=num_workers, + object_id_seed=object_id_seed, local_mode=local_mode, driver_mode=driver_mode, redirect_worker_output=redirect_worker_output, @@ -1859,11 +1754,18 @@ def init(redis_address=None, resources=resources, num_redis_shards=num_redis_shards, redis_max_clients=redis_max_clients, + redis_password=redis_password, plasma_directory=plasma_directory, huge_pages=huge_pages, include_webui=include_webui, object_store_memory=object_store_memory, - use_raylet=use_raylet) + redis_max_memory=redis_max_memory, + collect_profiling_data=collect_profiling_data, + driver_id=driver_id, + plasma_store_socket_name=plasma_store_socket_name, + raylet_socket_name=raylet_socket_name, + temp_dir=temp_dir, + _internal_config=_internal_config) for hook in _post_init_hooks: hook() return ret @@ -1899,19 +1801,15 @@ def shutdown(worker=global_worker): worker.plasma_client.disconnect() if worker.mode == SCRIPT_MODE: - # If this is a driver, push the finish time to Redis and clean up any - # other services that were started with the driver. - worker.redis_client.hmset(b"Drivers:" + worker.worker_id, - {"end_time": time.time()}) services.cleanup() else: # If this is not a driver, make sure there are no orphan processes, # besides possibly the worker itself. for process_type, processes in services.all_processes.items(): if process_type == services.PROCESS_TYPE_WORKER: - assert (len(processes)) <= 1 + assert len(processes) <= 1 else: - assert (len(processes) == 0) + assert len(processes) == 0 worker.set_mode(None) @@ -1942,9 +1840,6 @@ def print_error_messages_raylet(worker): This runs in a separate thread on the driver and prints error messages in the background. 
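
As of this change, use_raylet is accepted only for backwards compatibility: passing use_raylet=True logs a deprecation warning, while use_raylet=False raises. A short illustration (argument values are illustrative):

import logging
import ray

# The raylet code path is now the only one, so the flag is at best a no-op.
ray.init(logging_level=logging.WARNING,   # quieter driver logs
         use_raylet=True)                 # deprecated: logs a warning
ray.shutdown()

# use_raylet=False is no longer supported and raises before connecting.
try:
    ray.init(use_raylet=False)
except DeprecationWarning:
    pass
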
""" - if not worker.use_raylet: - raise Exception("This function is specific to the raylet code path.") - worker.error_message_pubsub_client = worker.redis_client.pubsub( ignore_subscribe_messages=True) # Exports that are published after the call to @@ -2014,12 +1909,6 @@ def print_error_messages(worker): worker.error_message_pubsub_client.subscribe("__keyspace@0__:ErrorKeys") num_errors_received = 0 - # Keep a set of all the error messages that we've seen so far in order to - # avoid printing the same error message repeatedly. This is especially - # important when running a script inside of a tool like screen where - # scrolling is difficult. - old_error_messages = set() - # Get the exports that occurred before the call to subscribe. with worker.lock: error_keys = worker.redis_client.lrange("ErrorKeys", 0, -1) @@ -2027,11 +1916,7 @@ def print_error_messages(worker): if error_applies_to_driver(error_key, worker=worker): error_message = ray.utils.decode( worker.redis_client.hget(error_key, "message")) - if error_message not in old_error_messages: - logger.error(error_message) - old_error_messages.add(error_message) - else: - logger.error("Suppressing duplicate error message.") + logger.error(error_message) num_errors_received += 1 try: @@ -2042,12 +1927,7 @@ def print_error_messages(worker): if error_applies_to_driver(error_key, worker=worker): error_message = ray.utils.decode( worker.redis_client.hget(error_key, "message")) - if error_message not in old_error_messages: - logger.error(error_message) - old_error_messages.add(error_message) - else: - logger.error( - "Suppressing duplicate error message.") + logger.error(error_message) num_errors_received += 1 except redis.ConnectionError: # When Redis terminates the listen call will throw a ConnectionError, @@ -2059,7 +1939,9 @@ def connect(info, object_id_seed=None, mode=WORKER_MODE, worker=global_worker, - use_raylet=False): + driver_id=None, + redis_password=None, + collect_profiling_data=True): """Connect this worker to the local scheduler, to Plasma, and to Redis. Args: @@ -2069,15 +1951,39 @@ def connect(info, deterministic. mode: The mode of the worker. One of SCRIPT_MODE, WORKER_MODE, and LOCAL_MODE. - use_raylet: True if the new raylet code path should be used. + driver_id: The ID of driver. If it's None, then we will generate one. + redis_password (str): Prevents external clients without the password + from connecting to Redis if provided. + collect_profiling_data: Whether to collect profiling data from workers. """ # Do some basic checking to make sure we didn't call ray.init twice. error_message = "Perhaps you called ray.init twice by accident?" assert not worker.connected, error_message assert worker.cached_functions_to_run is not None, error_message - assert worker.cached_remote_functions_and_actors is not None, error_message + + # Enable nice stack traces on SIGSEGV etc. + faulthandler.enable(all_threads=False) + + if collect_profiling_data: + worker.profiler = profiling.Profiler(worker) + else: + worker.profiler = profiling.NoopProfiler() + # Initialize some fields. - worker.worker_id = random_string() + if mode is WORKER_MODE: + worker.worker_id = random_string() + if setproctitle: + setproctitle.setproctitle("ray_worker") + else: + # This is the code path of driver mode. 
+ if driver_id is None: + driver_id = ray.ObjectID(random_string()) + + if not isinstance(driver_id, ray.ObjectID): + raise Exception( + "The type of given driver id must be ray.ObjectID.") + + worker.worker_id = driver_id.id() # When tasks are executed on remote workers in the context of multiple # drivers, the task driver ID is used to keep track of which driver is @@ -2091,7 +1997,6 @@ def connect(info, worker.actor_id = NIL_ACTOR_ID worker.connected = True worker.set_mode(mode) - worker.use_raylet = use_raylet # If running Ray in LOCAL_MODE, there is no need to create call # create_worker or to start the worker service. @@ -2104,7 +2009,10 @@ def connect(info, # Create a Redis client. redis_ip_address, redis_port = info["redis_address"].split(":") worker.redis_client = thread_safe_client( - redis.StrictRedis(host=redis_ip_address, port=int(redis_port))) + redis.StrictRedis( + host=redis_ip_address, + port=int(redis_port), + password=redis_password)) # For driver's check that the version information matches the version # information that the Ray cluster was started with. @@ -2117,7 +2025,6 @@ def connect(info, traceback_str = traceback.format_exc() ray.utils.push_error_to_driver_through_redis( worker.redis_client, - worker.use_raylet, ray_constants.VERSION_MISMATCH_PUSH_ERROR, traceback_str, driver_id=None) @@ -2135,16 +2042,19 @@ def connect(info, else: redirect_worker_output = 0 if redirect_worker_output: - log_stdout_file, log_stderr_file = services.new_log_files( - "worker", True) + log_stdout_file, log_stderr_file = ( + tempfile_services.new_worker_redirected_log_file( + worker.worker_id)) sys.stdout = log_stdout_file sys.stderr = log_stderr_file services.record_log_files_in_redis( - info["redis_address"], info["node_ip_address"], - [log_stdout_file, log_stderr_file]) + info["redis_address"], + info["node_ip_address"], [log_stdout_file, log_stderr_file], + password=redis_password) # Create an object for interfacing with the global state. - global_state._initialize_global_state(redis_ip_address, int(redis_port)) + global_state._initialize_global_state( + redis_ip_address, int(redis_port), redis_password=redis_password) # Register the worker with Redis. if mode == SCRIPT_MODE: @@ -2156,14 +2066,13 @@ def connect(info, "driver_id": worker.worker_id, "start_time": time.time(), "plasma_store_socket": info["store_socket_name"], - "plasma_manager_socket": info.get("manager_socket_name"), - "local_scheduler_socket": info.get("local_scheduler_socket_name"), "raylet_socket": info.get("raylet_socket_name") } driver_info["name"] = (main.__file__ if hasattr(main, "__file__") else "INTERACTIVE MODE") worker.redis_client.hmset(b"Drivers:" + worker.worker_id, driver_info) - if not worker.redis_client.exists("webui"): + if (not worker.redis_client.exists("webui") + and info["webui_url"] is not None): worker.redis_client.hmset("webui", {"url": info["webui_url"]}) is_worker = False elif mode == WORKER_MODE: @@ -2171,8 +2080,6 @@ def connect(info, worker_dict = { "node_ip_address": worker.node_ip_address, "plasma_store_socket": info["store_socket_name"], - "plasma_manager_socket": info["manager_socket_name"], - "local_scheduler_socket": info["local_scheduler_socket_name"] } if redirect_worker_output: worker_dict["stdout_file"] = os.path.abspath(log_stdout_file.name) @@ -2183,18 +2090,10 @@ def connect(info, raise Exception("This code should be unreachable.") # Create an object store client. 
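
Everything the driver registers here lands in plain Redis hashes, so it can be inspected with any Redis client as long as the same password is supplied. An illustrative, read-only peek at the web UI URL and the registered drivers, assuming a local cluster with Redis on the default port:

import redis

r = redis.StrictRedis(host="127.0.0.1", port=6379, password=None)

# The web UI URL is stored once under the "webui" hash.
print(r.hget("webui", "url"))

# Each driver writes a "Drivers:<worker_id>" hash with its sockets and name.
for key in r.keys(b"Drivers:*"):
    print(key, r.hgetall(key))
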
- if not worker.use_raylet: - worker.plasma_client = thread_safe_client( - plasma.connect(info["store_socket_name"], - info["manager_socket_name"], 64)) - else: - worker.plasma_client = thread_safe_client( - plasma.connect(info["store_socket_name"], "", 64)) + worker.plasma_client = thread_safe_client( + plasma.connect(info["store_socket_name"], "", 64)) - if not worker.use_raylet: - local_scheduler_socket = info["local_scheduler_socket_name"] - else: - local_scheduler_socket = info["raylet_socket_name"] + raylet_socket = info["raylet_socket_name"] # If this is a driver, set the current task ID, the task driver ID, and set # the task index to 0. @@ -2225,28 +2124,22 @@ def connect(info, # rerun the driver. nil_actor_counter = 0 - driver_task = ray.local_scheduler.Task( - worker.task_driver_id, ray.ObjectID(NIL_FUNCTION_ID), [], 0, - worker.current_task_id, worker.task_index, - ray.ObjectID(NIL_ACTOR_ID), ray.ObjectID(NIL_ACTOR_ID), - ray.ObjectID(NIL_ACTOR_ID), ray.ObjectID(NIL_ACTOR_ID), - nil_actor_counter, False, [], {"CPU": 0}, worker.use_raylet) + driver_task = ray.raylet.Task(worker.task_driver_id, + ray.ObjectID(NIL_FUNCTION_ID), [], 0, + worker.current_task_id, + worker.task_index, + ray.ObjectID(NIL_ACTOR_ID), + ray.ObjectID(NIL_ACTOR_ID), + ray.ObjectID(NIL_ACTOR_ID), + ray.ObjectID(NIL_ACTOR_ID), + nil_actor_counter, [], {"CPU": 0}, {}) # Add the driver task to the task table. - if not worker.use_raylet: - global_state._execute_command( - driver_task.task_id(), "RAY.TASK_TABLE_ADD", - driver_task.task_id().id(), TASK_STATUS_RUNNING, - NIL_LOCAL_SCHEDULER_ID, - driver_task.execution_dependencies_string(), 0, - ray.local_scheduler.task_to_string(driver_task)) - else: - global_state._execute_command( - driver_task.task_id(), "RAY.TABLE_ADD", - ray.gcs_utils.TablePrefix.RAYLET_TASK, - ray.gcs_utils.TablePubsub.RAYLET_TASK, - driver_task.task_id().id(), - driver_task._serialized_raylet_task()) + global_state._execute_command(driver_task.task_id(), "RAY.TABLE_ADD", + ray.gcs_utils.TablePrefix.RAYLET_TASK, + ray.gcs_utils.TablePubsub.RAYLET_TASK, + driver_task.task_id().id(), + driver_task._serialized_raylet_task()) # Set the driver's current task ID to the task ID assigned to the # driver task. @@ -2254,10 +2147,12 @@ def connect(info, else: # A non-driver worker begins without an assigned task. worker.current_task_id = ray.ObjectID(NIL_ID) + # A flag for making sure that we only print one warning message about + # multithreading per worker. + worker.multithreading_warned = False - worker.local_scheduler_client = ray.local_scheduler.LocalSchedulerClient( - local_scheduler_socket, worker.worker_id, is_worker, - worker.current_task_id, worker.use_raylet) + worker.local_scheduler_client = ray.raylet.LocalSchedulerClient( + raylet_socket, worker.worker_id, is_worker, worker.current_task_id) # Start the import thread import_thread.ImportThread(worker, mode).start() @@ -2269,16 +2164,10 @@ def connect(info, # temporarily using this implementation which constantly queries the # scheduler for new error messages. if mode == SCRIPT_MODE: - if not worker.use_raylet: - t = threading.Thread( - target=print_error_messages, - name="ray_print_error_messages", - args=(worker, )) - else: - t = threading.Thread( - target=print_error_messages_raylet, - name="ray_print_error_messages", - args=(worker, )) + t = threading.Thread( + target=print_error_messages_raylet, + name="ray_print_error_messages", + args=(worker, )) # Making the thread a daemon causes it to exit when the main thread # exits. 
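
The worker now always talks to the plasma store directly; the separate plasma manager socket is gone, hence the empty second argument. For debugging, the same store can be opened outside of Ray with the plasma client bundled in pyarrow at this point in time. The socket path below is an assumption, taken from whatever address_info reports on a given node:

import pyarrow.plasma as plasma

# Same call pattern as worker.connect(): socket path, no manager socket,
# release delay of 64 (both trailing arguments were still required by the
# pyarrow version pinned for this release).
client = plasma.connect("/tmp/plasma_store_socket", "", 64)

# Probe for an arbitrary, illustrative object ID.
print(client.contains(plasma.ObjectID(20 * b"\x00")))
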
t.daemon = True @@ -2286,7 +2175,7 @@ def connect(info, # If we are using the raylet code path and we are not in local mode, start # a background thread to periodically flush profiling data to the GCS. - if mode != LOCAL_MODE and worker.use_raylet: + if mode != LOCAL_MODE: worker.profiler.start_flush_thread() if mode == SCRIPT_MODE: @@ -2312,18 +2201,9 @@ def connect(info, # Export cached functions_to_run. for function in worker.cached_functions_to_run: worker.run_function_on_all_workers(function) - # Export cached remote functions to the workers. - for cached_type, info in worker.cached_remote_functions_and_actors: - if cached_type == "remote_function": - info._export() - elif cached_type == "actor": - (key, actor_class_info) = info - ray.actor.publish_actor_class_to_key(key, actor_class_info, - worker) - else: - assert False, "This code should be unreachable." + # Export cached remote functions and actors to the workers. + worker.function_actor_manager.export_cached() worker.cached_functions_to_run = None - worker.cached_remote_functions_and_actors = None def disconnect(worker=global_worker): @@ -2334,10 +2214,19 @@ def disconnect(worker=global_worker): # tests. worker.connected = False worker.cached_functions_to_run = [] - worker.cached_remote_functions_and_actors = [] + worker.function_actor_manager.reset_cache() worker.serialization_context_map.clear() +@contextmanager +def _changeproctitle(title, next_title): + if setproctitle: + setproctitle.setproctitle(title) + yield + if setproctitle: + setproctitle.setproctitle(next_title) + + def _try_to_compute_deterministic_class_id(cls, depth=5): """Attempt to produce a deterministic class ID for a given class. @@ -2444,7 +2333,7 @@ def register_custom_serializer(cls, # worker. However, determinism is not guaranteed, and the # result may be different on different workers. class_id = _try_to_compute_deterministic_class_id(cls) - except Exception as e: + except Exception: raise serialization.CloudPickleError("Failed to pickle class " "'{}'".format(cls)) else: @@ -2452,6 +2341,9 @@ def register_custom_serializer(cls, # worker and not across workers. class_id = random_string() + # Make sure class_id is a string. + class_id = ray.utils.binary_to_hex(class_id) + if driver_id is None: driver_id_bytes = worker.task_driver_id.id() else: @@ -2538,7 +2430,7 @@ def put(value, worker=global_worker): # In LOCAL_MODE, ray.put is the identity operation. return value object_id = worker.local_scheduler_client.compute_put_id( - worker.current_task_id, worker.put_index, worker.use_raylet) + worker.current_task_id, worker.put_index) worker.put_object(object_id, value) worker.put_index += 1 return object_id @@ -2590,6 +2482,7 @@ def wait(object_ids, num_returns=1, timeout=None, worker=global_worker): type(object_id))) worker.check_connected() + # TODO(swang): Check main thread. with profiling.profile("ray.wait", worker=worker): # When Ray is run in LOCAL_MODE, all functions are run immediately, # so all objects in object_id are ready. @@ -2610,22 +2503,14 @@ def wait(object_ids, num_returns=1, timeout=None, worker=global_worker): if num_returns > len(object_ids): raise Exception("num_returns cannot be greater than the number " "of objects provided to ray.wait.") + + # Get the task ID, to notify the backend which task is blocked. 
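
The small _changeproctitle helper defined further down is an ordinary contextmanager: it renames the process while a task runs and sets the follow-up title afterwards, silently doing nothing when setproctitle is not installed. A hedged usage sketch (the titles are illustrative, and importing a private helper like this is for demonstration only):

from ray.worker import _changeproctitle

# While inside the block, `ps`/`top` show the process under the first title;
# afterwards it flips to the second. Requires `pip install setproctitle`
# (or ray[debug]); otherwise both calls are no-ops.
with _changeproctitle("ray_worker:example_task()", "ray_worker"):
    result = sum(range(10))
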
+ with worker.state_lock: + current_task_id = worker.get_current_thread_task_id() + timeout = timeout if timeout is not None else 2**30 - if worker.use_raylet: - ready_ids, remaining_ids = worker.local_scheduler_client.wait( - object_ids, num_returns, timeout, False) - else: - object_id_strs = [ - plasma.ObjectID(object_id.id()) for object_id in object_ids - ] - ready_ids, remaining_ids = worker.plasma_client.wait( - object_id_strs, timeout, num_returns) - ready_ids = [ - ray.ObjectID(object_id.binary()) for object_id in ready_ids - ] - remaining_ids = [ - ray.ObjectID(object_id.binary()) for object_id in remaining_ids - ] + ready_ids, remaining_ids = worker.local_scheduler_client.wait( + object_ids, num_returns, timeout, False, current_task_id) return ready_ids, remaining_ids diff --git a/python/ray/workers/default_worker.py b/python/ray/workers/default_worker.py index cd7b3f4a45c35..dc1085783b8aa 100644 --- a/python/ray/workers/default_worker.py +++ b/python/ray/workers/default_worker.py @@ -9,6 +9,7 @@ import ray import ray.actor import ray.ray_constants as ray_constants +import ray.tempfile_services as tempfile_services parser = argparse.ArgumentParser( description=("Parse addresses for the worker " @@ -23,6 +24,12 @@ required=True, type=str, help="the address to use for Redis") +parser.add_argument( + "--redis-password", + required=False, + type=str, + default=None, + help="the password to use for Redis") parser.add_argument( "--object-store-name", required=True, @@ -33,11 +40,6 @@ required=False, type=str, help="the object store manager's name") -parser.add_argument( - "--local-scheduler-name", - required=False, - type=str, - help="the local scheduler's name") parser.add_argument( "--raylet-name", required=False, type=str, help="the raylet's name") parser.add_argument( @@ -53,6 +55,17 @@ type=str, default=ray_constants.LOGGER_FORMAT, help=ray_constants.LOGGER_FORMAT_HELP) +parser.add_argument( + "--collect-profiling-data", + type=int, # int since argparse can't handle bool values + default=1, + help="Whether to collect profiling data from workers.") +parser.add_argument( + "--temp-dir", + required=False, + type=str, + default=None, + help="Specify the path of the temporary directory use by Ray process.") if __name__ == "__main__": args = parser.parse_args() @@ -60,18 +73,24 @@ info = { "node_ip_address": args.node_ip_address, "redis_address": args.redis_address, + "redis_password": args.redis_password, "store_socket_name": args.object_store_name, "manager_socket_name": args.object_store_manager_name, - "local_scheduler_socket_name": args.local_scheduler_name, - "raylet_socket_name": args.raylet_name + "raylet_socket_name": args.raylet_name, } logging.basicConfig( level=logging.getLevelName(args.logging_level.upper()), format=args.logging_format) + # Override the temporary directory. + tempfile_services.set_temp_root(args.temp_dir) + ray.worker.connect( - info, mode=ray.WORKER_MODE, use_raylet=(args.raylet_name is not None)) + info, + mode=ray.WORKER_MODE, + redis_password=args.redis_password, + collect_profiling_data=args.collect_profiling_data) error_explanation = """ This error is unexpected and should not have happened. Somehow a worker @@ -86,7 +105,7 @@ # main_loop. If an exception is thrown here, then that means that # there is some error that we didn't anticipate. 
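
ray.wait now always goes through the raylet client and passes the calling task's ID so the backend knows which task is blocked; the timeout is expressed in milliseconds at this point in Ray's history, with 2**30 standing in for "no timeout". A small usage sketch:

import ray

ray.init()

@ray.remote
def f(i):
    return i

object_ids = [f.remote(i) for i in range(4)]

# Wait until at least two of the four results are ready, or 1000 ms elapse;
# num_returns may not exceed len(object_ids).
ready, remaining = ray.wait(object_ids, num_returns=2, timeout=1000)
print(len(ready), len(remaining))
ray.shutdown()
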
ray.worker.global_worker.main_loop() - except Exception as e: + except Exception: traceback_str = traceback.format_exc() + error_explanation ray.utils.push_error_to_driver( ray.worker.global_worker, diff --git a/python/setup.py b/python/setup.py index 70d7cd87fadb7..c92ffa65b481d 100644 --- a/python/setup.py +++ b/python/setup.py @@ -3,6 +3,7 @@ from __future__ import print_function import os +import re import shutil import subprocess import sys @@ -19,13 +20,10 @@ # NOTE: The lists below must be kept in sync with ray/CMakeLists.txt. ray_files = [ - "ray/core/src/common/thirdparty/redis/src/redis-server", - "ray/core/src/common/redis_module/libray_redis_module.so", + "ray/core/src/ray/thirdparty/redis/src/redis-server", + "ray/core/src/ray/gcs/redis_module/libray_redis_module.so", "ray/core/src/plasma/plasma_store_server", - "ray/core/src/plasma/plasma_manager", - "ray/core/src/local_scheduler/local_scheduler", - "ray/core/src/local_scheduler/liblocal_scheduler_library_python.so", - "ray/core/src/global_scheduler/global_scheduler", + "ray/core/src/ray/raylet/liblocal_scheduler_library_python.so", "ray/core/src/ray/raylet/raylet_monitor", "ray/core/src/ray/raylet/raylet", "ray/WebUI.ipynb" ] @@ -47,6 +45,7 @@ ray_autoscaler_files = [ "ray/autoscaler/aws/example-full.yaml", "ray/autoscaler/gcp/example-full.yaml", + "ray/autoscaler/local/example-full.yaml", ] if "RAY_USE_NEW_GCS" in os.environ and os.environ["RAY_USE_NEW_GCS"] == "on": @@ -65,7 +64,10 @@ optional_ray_files += ray_autoscaler_files -extras = {"rllib": ["pyyaml", "gym[atari]", "opencv-python", "lz4", "scipy"]} +extras = { + "rllib": ["pyyaml", "gym[atari]", "opencv-python", "lz4", "scipy"], + "debug": ["psutil", "setproctitle", "py-spy"], +} class build_ext(_build_ext.build_ext): @@ -98,7 +100,7 @@ def run(self): for filename in optional_ray_files: try: self.move_file(filename) - except Exception as e: + except Exception: print("Failed to copy optional file {}. This is ok." .format(filename)) @@ -121,26 +123,47 @@ def has_ext_modules(self): return True +def find_version(*filepath): + # Extract version information from filepath + here = os.path.abspath(os.path.dirname(__file__)) + with open(os.path.join(here, *filepath)) as fp: + version_match = re.search(r"^__version__ = ['\"]([^'\"]*)['\"]", + fp.read(), re.M) + if version_match: + return version_match.group(1) + raise RuntimeError("Unable to find version string.") + + +requires = [ + "numpy", + "funcsigs", + "click", + "colorama", + "pytest", + "pyyaml", + "redis", + # The six module is required by pyarrow. + "six >= 1.0.0", + "flatbuffers", +] + +if sys.version_info < (3, 0): + requires.append("faulthandler") + setup( name="ray", - # The version string is also in __init__.py. TODO(pcm): Fix this. - version="0.5.3", + version=find_version("ray", "__init__.py"), + description=("A system for parallel and distributed Python that unifies " + "the ML ecosystem."), + long_description=open("../README.rst").read(), + url="https://github.com/ray-project/ray", + keywords=("ray distributed parallel machine-learning " + "reinforcement-learning deep-learning python"), packages=find_packages(), cmdclass={"build_ext": build_ext}, # The BinaryDistribution argument triggers build_ext. distclass=BinaryDistribution, - install_requires=[ - "numpy", - "funcsigs", - "click", - "colorama", - "pytest", - "pyyaml", - "redis", - # The six module is required by pyarrow. 
- "six >= 1.0.0", - "flatbuffers" - ], + install_requires=requires, setup_requires=["cython >= 0.27, < 0.28"], extras_require=extras, entry_points={ diff --git a/site/Gemfile b/site/Gemfile index 8af267397b31b..9ae4bf67ff67d 100644 --- a/site/Gemfile +++ b/site/Gemfile @@ -9,7 +9,7 @@ ruby RUBY_VERSION # # This will help ensure the proper Jekyll version is running. # Happy Jekylling! -gem "jekyll", "3.4.3" +gem "jekyll", ">= 3.6.3" # This is the default theme for new Jekyll sites. You may change this to anything you like. gem "minima", "~> 2.0" diff --git a/src/common/CMakeLists.txt b/src/common/CMakeLists.txt deleted file mode 100644 index b024b4a0419f3..0000000000000 --- a/src/common/CMakeLists.txt +++ /dev/null @@ -1,131 +0,0 @@ -cmake_minimum_required(VERSION 3.4) - -project(common) - -if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") - include_directories("${CMAKE_CURRENT_LIST_DIR}/lib/python") -endif () - -add_subdirectory(redis_module) - -set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fPIC -g") - -include_directories(thirdparty/ae) - -# Compile flatbuffers - -set(COMMON_FBS_SRC "${CMAKE_CURRENT_LIST_DIR}/format/common.fbs") -set(OUTPUT_DIR ${CMAKE_CURRENT_LIST_DIR}/format/) - -set(COMMON_FBS_OUTPUT_FILES - "${OUTPUT_DIR}/common_generated.h") - -add_custom_target(gen_common_fbs DEPENDS ${COMMON_FBS_OUTPUT_FILES}) - -add_custom_command( - OUTPUT ${COMMON_FBS_OUTPUT_FILES} - # The --gen-object-api flag generates a C++ class MessageT for each - # flatbuffers message Message, which can be used to store deserialized - # messages in data structures. This is currently used for ObjectInfo for - # example. - COMMAND ${FLATBUFFERS_COMPILER} -c -o ${OUTPUT_DIR} ${COMMON_FBS_SRC} --gen-object-api --scoped-enums - DEPENDS ${FBS_DEPENDS} - COMMENT "Running flatc compiler on ${COMMON_FBS_SRC}" - VERBATIM) - -if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") - add_custom_target(gen_common_python_fbs DEPENDS ${COMMON_FBS_OUTPUT_FILES}) - - # Generate Python bindings for the flatbuffers objects. - set(PYTHON_OUTPUT_DIR ${CMAKE_CURRENT_LIST_DIR}/../../python/ray/core/generated/) - add_custom_command( - TARGET gen_common_python_fbs - COMMAND ${FLATBUFFERS_COMPILER} -p -o ${PYTHON_OUTPUT_DIR} ${COMMON_FBS_SRC} - DEPENDS ${FBS_DEPENDS} - COMMENT "Running flatc compiler on ${COMMON_FBS_SRC}" - VERBATIM) - - # Encode the fact that the ray redis module requires the autogenerated - # flatbuffer files to compile. - add_dependencies(ray_redis_module gen_common_python_fbs) - - add_dependencies(gen_common_python_fbs flatbuffers_ep) -endif() - -if ("${CMAKE_RAY_LANG_JAVA}" STREQUAL "YES") - add_custom_target(gen_common_java_fbs DEPENDS ${COMMON_FBS_OUTPUT_FILES}) - - # Generate Java bindings for the flatbuffers objects. - set(JAVA_OUTPUT_DIR ${CMAKE_BINARY_DIR}/generated/java) - add_custom_command( - TARGET gen_common_java_fbs - COMMAND ${FLATBUFFERS_COMPILER} -j -o ${JAVA_OUTPUT_DIR} ${COMMON_FBS_SRC} - DEPENDS ${FBS_DEPENDS} - COMMENT "Running flatc compiler on ${COMMON_FBS_SRC}" - VERBATIM) - - # Encode the fact that the ray redis module requires the autogenerated - # flatbuffer files to compile. 
- add_dependencies(ray_redis_module gen_common_java_fbs) - - add_dependencies(gen_common_java_fbs flatbuffers_ep) -endif() - -add_custom_target( - hiredis - COMMAND make - WORKING_DIRECTORY ${CMAKE_CURRENT_LIST_DIR}/thirdparty/hiredis) - -add_library(common STATIC - event_loop.cc - common.cc - common_protocol.cc - task.cc - io.cc - net.cc - logging.cc - state/redis.cc - state/table.cc - state/object_table.cc - state/task_table.cc - state/db_client_table.cc - state/driver_table.cc - state/actor_notification_table.cc - state/local_scheduler_table.cc - state/error_table.cc - thirdparty/ae/ae.c - thirdparty/sha256.c) - -add_dependencies(common arrow) - -if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") - add_dependencies(common gen_common_python_fbs) -endif() - -if ("${CMAKE_RAY_LANG_JAVA}" STREQUAL "YES") - add_dependencies(common gen_common_java_fbs) -endif() - -target_link_libraries(common "${CMAKE_CURRENT_LIST_DIR}/thirdparty/hiredis/libhiredis.a") - -function(define_test test_name library) - add_executable(${test_name} test/${test_name}.cc ${ARGN}) - add_dependencies(${test_name} hiredis flatbuffers_ep) - target_link_libraries(${test_name} common ${FLATBUFFERS_STATIC_LIB} ray_static ${PLASMA_STATIC_LIB} ${ARROW_STATIC_LIB} ${library} -lpthread) - target_compile_options(${test_name} PUBLIC "-DPLASMA_TEST -DLOCAL_SCHEDULER_TEST -DCOMMON_TEST -DRAY_COMMON_LOG_LEVEL=4") -endfunction() - -define_test(db_tests "") -define_test(io_tests "") -define_test(task_tests "") -define_test(redis_tests "") -define_test(task_table_tests "") -define_test(object_table_tests "") - -add_custom_target(copy_redis ALL) -foreach(file "redis-cli" "redis-server") -add_custom_command(TARGET copy_redis POST_BUILD - COMMAND ${CMAKE_COMMAND} -E - copy ${CMAKE_CURRENT_LIST_DIR}/../../thirdparty/pkg/redis/src/${file} - ${CMAKE_BINARY_DIR}/src/common/thirdparty/redis/src/${file}) -endforeach() diff --git a/src/common/common.cc b/src/common/common.cc deleted file mode 100644 index 0a6da6a2936e8..0000000000000 --- a/src/common/common.cc +++ /dev/null @@ -1,20 +0,0 @@ -#include "common.h" - -#include -#include -#include -#include -#include -#include - -#include "io.h" -#include - -const unsigned char NIL_DIGEST[DIGEST_SIZE] = {0}; - -int64_t current_time_ms() { - std::chrono::milliseconds ms_since_epoch = - std::chrono::duration_cast( - std::chrono::steady_clock::now().time_since_epoch()); - return ms_since_epoch.count(); -} diff --git a/src/common/common.h b/src/common/common.h deleted file mode 100644 index f95bfcca5d262..0000000000000 --- a/src/common/common.h +++ /dev/null @@ -1,75 +0,0 @@ -#ifndef COMMON_H -#define COMMON_H - -#include -#include -#include -#ifndef __STDC_FORMAT_MACROS -#define __STDC_FORMAT_MACROS -#endif -#include -#include -#ifndef _WIN32 -#include -#endif - -#ifdef __cplusplus -#include -extern "C" { -#endif -#include "sha256.h" -#ifdef __cplusplus -} -#endif - -#include "arrow/util/macros.h" -#include "plasma/common.h" -#include "ray/id.h" -#include "ray/util/logging.h" - -#include "state/ray_config.h" - -/** Definitions for Ray logging levels. */ -#define RAY_COMMON_DEBUG 0 -#define RAY_COMMON_INFO 1 -#define RAY_COMMON_WARNING 2 -#define RAY_COMMON_ERROR 3 -#define RAY_COMMON_FATAL 4 - -/** - * RAY_COMMON_LOG_LEVEL should be defined to one of the above logging level - * integer values. Any logging statement in the code with a logging level - * greater than or equal to RAY_COMMON_LOG_LEVEL will be outputted to stderr. - * The default logging level is INFO. 
*/ -#ifndef RAY_COMMON_LOG_LEVEL -#define RAY_COMMON_LOG_LEVEL RAY_COMMON_INFO -#endif - -/* These are exit codes for common errors that can occur in Ray components. */ -#define EXIT_COULD_NOT_BIND_PORT -2 - -/** This macro indicates that this pointer owns the data it is pointing to - * and is responsible for freeing it. */ -#define OWNER - -/** The worker ID is the ID of a worker or driver. */ -typedef ray::UniqueID WorkerID; - -typedef ray::UniqueID DBClientID; - -#define MAX(x, y) ((x) >= (y) ? (x) : (y)) -#define MIN(x, y) ((x) <= (y) ? (x) : (y)) - -/** Definitions for computing hash digests. */ -#define DIGEST_SIZE SHA256_BLOCK_SIZE - -extern const unsigned char NIL_DIGEST[DIGEST_SIZE]; - -/** - * Return the current time in milliseconds since the Unix epoch. - * - * @return The number of milliseconds since the Unix epoch. - */ -int64_t current_time_ms(); - -#endif diff --git a/src/common/doc/tasks.md b/src/common/doc/tasks.md deleted file mode 100644 index 4431afae2ee9e..0000000000000 --- a/src/common/doc/tasks.md +++ /dev/null @@ -1,32 +0,0 @@ -# Task specifications, task instances and task logs - -A *task specification* contains all information that is needed for computing -the results of a task: - -- The ID of the task -- The function ID of the function that executes the task -- The arguments (either object IDs for pass by reference -or values for pass by value) -- The IDs of the result objects - -From these, a task ID can be computed which is also stored in the task -specification. - -A *task* represents the execution of a task specification. -It consists of: - -- A scheduling state (WAITING, SCHEDULED, RUNNING, DONE) -- The target node where the task is scheduled or executed -- The task specification - -The task data structures are defined in `common/task.h`. - -The *task table* is a mapping from the task ID to the *task* information. It is -updated by various parts of the system: - -1. The local scheduler writes it with status WAITING when submits a task to the global scheduler -2. The global scheduler appends an update WAITING -> SCHEDULED together with the node ID when assigning the task to a local scheduler -3. The local scheduler appends an update SCHEDULED -> RUNNING when it assigns a task to a worker -4. The local scheduler appends an update RUNNING -> DONE when the task finishes execution - -The task table is defined in `common/state/task_table.h`. diff --git a/src/common/event_loop.cc b/src/common/event_loop.cc deleted file mode 100644 index e3d9cc4a2dc6f..0000000000000 --- a/src/common/event_loop.cc +++ /dev/null @@ -1,63 +0,0 @@ -#include "event_loop.h" - -#include "common.h" -#include - -#define INITIAL_EVENT_LOOP_SIZE 1024 - -event_loop *event_loop_create(void) { - return aeCreateEventLoop(INITIAL_EVENT_LOOP_SIZE); -} - -void event_loop_destroy(event_loop *loop) { - /* Clean up timer events. This is to make valgrind happy. */ - aeTimeEvent *te = loop->timeEventHead; - while (te) { - aeTimeEvent *next = te->next; - free(te); - te = next; - } - aeDeleteEventLoop(loop); -} - -bool event_loop_add_file(event_loop *loop, - int fd, - int events, - event_loop_file_handler handler, - void *context) { - /* Try to add the file descriptor. */ - int err = aeCreateFileEvent(loop, fd, events, handler, context); - /* If it cannot be added, increase the size of the event loop. 
*/ - if (err == AE_ERR && errno == ERANGE) { - err = aeResizeSetSize(loop, 3 * aeGetSetSize(loop) / 2); - if (err != AE_OK) { - return false; - } - err = aeCreateFileEvent(loop, fd, events, handler, context); - } - /* In any case, test if there were errors. */ - return (err == AE_OK); -} - -void event_loop_remove_file(event_loop *loop, int fd) { - aeDeleteFileEvent(loop, fd, EVENT_LOOP_READ | EVENT_LOOP_WRITE); -} - -int64_t event_loop_add_timer(event_loop *loop, - int64_t timeout, - event_loop_timer_handler handler, - void *context) { - return aeCreateTimeEvent(loop, timeout, handler, context, NULL); -} - -int event_loop_remove_timer(event_loop *loop, int64_t id) { - return aeDeleteTimeEvent(loop, id); -} - -void event_loop_run(event_loop *loop) { - aeMain(loop); -} - -void event_loop_stop(event_loop *loop) { - aeStop(loop); -} diff --git a/src/common/event_loop.h b/src/common/event_loop.h deleted file mode 100644 index e489ab4fb6729..0000000000000 --- a/src/common/event_loop.h +++ /dev/null @@ -1,103 +0,0 @@ -#ifndef EVENT_LOOP_H -#define EVENT_LOOP_H - -#include - -extern "C" { -#ifdef _WIN32 -/* Quirks mean that Windows version needs to be included differently */ -#include -#include -#else -#include "ae/ae.h" -#endif -} - -/* Unique timer ID that will be generated when the timer is added to the - * event loop. Will not be reused later on in another call - * to event_loop_add_timer. */ -typedef long long timer_id; - -typedef aeEventLoop event_loop; - -/* File descriptor is readable. */ -#define EVENT_LOOP_READ AE_READABLE - -/* File descriptor is writable. */ -#define EVENT_LOOP_WRITE AE_WRITABLE - -/* Constant specifying that the timer is done and it will be removed. */ -#define EVENT_LOOP_TIMER_DONE AE_NOMORE - -/* Signature of the handler that will be called when there is a new event - * on the file descriptor that this handler has been registered for. The - * context is the one that was passed into add_file by the user. The - * events parameter indicates which event is available on the file, - * it can be EVENT_LOOP_READ or EVENT_LOOP_WRITE. */ -typedef void (*event_loop_file_handler)(event_loop *loop, - int fd, - void *context, - int events); - -/* This handler will be called when a timer times out. The id of the timer - * as well as the context that was specified when registering this handler - * are passed as arguments. The return is the number of milliseconds the - * timer shall be reset to or EVENT_LOOP_TIMER_DONE if the timer shall - * not be triggered again. */ -typedef int (*event_loop_timer_handler)(event_loop *loop, - timer_id timer_id, - void *context); - -/* Create and return a new event loop. */ -event_loop *event_loop_create(void); - -/* Deallocate space associated with the event loop that was created - * with the "create" function. */ -void event_loop_destroy(event_loop *loop); - -/* Register a handler that will be called any time a new event happens on - * a file descriptor. Can specify a context that will be passed as an - * argument to the handler. Currently there can only be one handler per file. - * The events parameter specifies which events we listen to: EVENT_LOOP_READ - * or EVENT_LOOP_WRITE. */ -bool event_loop_add_file(event_loop *loop, - int fd, - int events, - event_loop_file_handler handler, - void *context); - -/* Remove a registered file event handler from the event loop. */ -void event_loop_remove_file(event_loop *loop, int fd); - -/** Register a handler that will be called after a time slice of - * "timeout" milliseconds. 
- * - * @param loop The event loop. - * @param timeout The timeout in milliseconds. - * @param handler The handler for the timeout. - * @param context User context that can be passed in and will be passed in - * as an argument for the timer handler. - * @return The ID of the timer. - */ -int64_t event_loop_add_timer(event_loop *loop, - int64_t timeout, - event_loop_timer_handler handler, - void *context); - -/** - * Remove a registered time event handler from the event loop. Can be called - * multiple times on the same timer. - * - * @param loop The event loop. - * @param timer_id The ID of the timer to be removed. - * @return Returns 0 if the removal was successful. - */ -int event_loop_remove_timer(event_loop *loop, int64_t timer_id); - -/* Run the event loop. */ -void event_loop_run(event_loop *loop); - -/* Stop the event loop. */ -void event_loop_stop(event_loop *loop); - -#endif diff --git a/src/common/format/common.fbs b/src/common/format/common.fbs deleted file mode 100644 index 9dc9f651a3e32..0000000000000 --- a/src/common/format/common.fbs +++ /dev/null @@ -1,200 +0,0 @@ - -// Indices into resource vectors. -// A resource vector maps a resource index to the number -// of units of that resource required. - -table Arg { - // Object ID for pass-by-reference arguments. Normally there is only one - // object ID in this list which represents the object that is being passed. - // However to support reducers in a MapReduce workload, we also support - // passing multiple object IDs for each argument. - object_ids: [string]; - // Data for pass-by-value arguments. - data: string; -} - -table ResourcePair { - // The name of the resource. - key: string; - // The quantity of the resource. - value: double; -} - -// NOTE: This enum is duplicate with the `Language` enum in `gcs.fbs`, -// because we cannot include this file in `gcs.fbs` due to cyclic dependency. -// TODO(raulchen): remove it once we get rid of legacy ray. -enum TaskLanguage:int { - PYTHON = 0, - JAVA = 1 -} - -table TaskInfo { - // ID of the driver that created this task. - driver_id: string; - // Task ID of the task. - task_id: string; - // Task ID of the parent task. - parent_task_id: string; - // A count of the number of tasks submitted by the parent task before this one. - parent_counter: int; - // The ID of the actor to create if this is an actor creation task. - actor_creation_id: string; - // The dummy object ID of the actor creation task if this is an actor method. - actor_creation_dummy_object_id: string; - // Actor ID of the task. This is the actor that this task is executed on - // or NIL_ACTOR_ID if the task is just a normal task. - actor_id: string; - // The ID of the handle that was used to submit the task. This should be - // unique across handles with the same actor_id. - actor_handle_id: string; - // Number of tasks that have been submitted to this actor so far. - actor_counter: int; - // True if this task is an actor checkpoint task and false otherwise. - is_actor_checkpoint_method: bool; - // Function ID of the task. - function_id: string; - // Task arguments. - args: [Arg]; - // Object IDs of return values. - returns: [string]; - // The required_resources vector indicates the quantities of the different - // resources required by this task. - required_resources: [ResourcePair]; - // The language that this task belongs to - language: TaskLanguage; - // Function descriptor, which is a list of strings that can - // uniquely describe a function. 
- // For a Python function, it should be: [module_name, class_name, function_name] - // For a Java function, it should be: [class_name, method_name, type_descriptor] - // TODO(hchen): after changing Python worker to use function_descriptor, - // function_id can be removed. - function_descriptor: [string]; -} - -// Object information data structure. -// NOTE(pcm): This structure is replicated in -// https://github.com/apache/arrow/blob/master/cpp/src/plasma/format/common.fbs, -// so if you modify it, you should also modify that one. -table ObjectInfo { - // Object ID of this object. - object_id: string; - // Number of bytes the content of this object occupies in memory. - data_size: long; - // Number of bytes the metadata of this object occupies in memory. - metadata_size: long; - // Number of clients using the objects. - ref_count: int; - // Unix epoch of when this object was created. - create_time: long; - // How long creation of this object took. - construct_duration: long; - // Hash of the object content. If the object is not sealed yet this is - // an empty string. - digest: string; - // Specifies if this object was deleted or added. - is_deletion: bool; -} - -root_type TaskInfo; - -table TaskExecutionDependencies { - // A list of object IDs representing this task's dependencies at execution - // time. - execution_dependencies: [string]; -} - -root_type TaskExecutionDependencies; - -table SubscribeToNotificationsReply { - // The object ID of the object that the notification is about. - object_id: string; - // The size of the object. - object_size: long; - // The IDs of the managers that contain this object. - manager_ids: [string]; -} - -root_type SubscribeToNotificationsReply; - -table TaskReply { - // The task ID of the task that the message is about. - task_id: string; - // The state of the task. This is encoded as a bit mask of scheduling_state - // enum values in task.h. - state: long; - // A local scheduler ID. - local_scheduler_id: string; - // A string of bytes representing the task's TaskExecutionDependencies. - execution_dependencies: string; - // A string of bytes representing the task specification. - task_spec: string; - // The number of times the task was spilled back by local schedulers. - spillback_count: long; - // A boolean representing whether the update was successful. This field - // should only be used for test-and-set operations. - updated: bool; -} - -root_type TaskReply; - -table SubscribeToDBClientTableReply { - // The db client ID of the client that the message is about. - db_client_id: string; - // The type of the client. - client_type: string; - // If the client is a local scheduler, this is the address of the plasma - // manager that the local scheduler is connected to. Otherwise, it is empty. - manager_address: string; - // True if the message is about the addition of a client and false if it is - // about the deletion of a client. - is_insertion: bool; -} - -root_type SubscribeToDBClientTableReply; - -table LocalSchedulerInfoMessage { - // The db client ID of the client that the message is about. - db_client_id: string; - // The total number of workers that are connected to this local scheduler. - total_num_workers: long; - // The number of tasks queued in this local scheduler. - task_queue_length: long; - // The number of workers that are available and waiting for tasks. - available_workers: long; - // The resources generally available to this local scheduler. 
- static_resources: [ResourcePair]; - // The resources currently available to this local scheduler. - dynamic_resources: [ResourcePair]; - // Whether the local scheduler is dead. If true, then all other fields - // besides `db_client_id` will not be set. - is_dead: bool; -} - -root_type LocalSchedulerInfoMessage; - -table ResultTableReply { - // The task ID of the task that created the object. - task_id: string; - // Whether the task created the object through a ray.put. - is_put: bool; - // The size of the object created. - data_size: long; - // The hash of the object created. - hash: string; -} - -root_type ResultTableReply; - -table DriverTableMessage { - // The driver ID of the driver that died. - driver_id: string; -} - -table ActorCreationNotification { - // The ID of the actor that was created. - actor_id: string; - // The ID of the driver that created the actor. - driver_id: string; - // The ID of the local scheduler that created the actor. - local_scheduler_id: string; -} diff --git a/src/common/io.cc b/src/common/io.cc deleted file mode 100644 index 1999b70546694..0000000000000 --- a/src/common/io.cc +++ /dev/null @@ -1,416 +0,0 @@ -#include "io.h" - -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include - -#include "common.h" -#include "event_loop.h" - -#ifndef _WIN32 -/* This function is actually not declared in standard POSIX, so declare it. */ -extern int usleep(useconds_t usec); -#endif - -int bind_inet_sock(const int port, bool shall_listen) { - struct sockaddr_in name; - int socket_fd = socket(PF_INET, SOCK_STREAM, 0); - if (socket_fd < 0) { - RAY_LOG(ERROR) << "socket() failed for port " << port; - return -1; - } - name.sin_family = AF_INET; - name.sin_port = htons(port); - name.sin_addr.s_addr = htonl(INADDR_ANY); - int on = 1; - /* TODO(pcm): http://stackoverflow.com/q/1150635 */ - if (ioctl(socket_fd, FIONBIO, (char *) &on) < 0) { - RAY_LOG(ERROR) << "ioctl failed"; - close(socket_fd); - return -1; - } - int *const pon = (int *const) & on; - if (setsockopt(socket_fd, SOL_SOCKET, SO_REUSEADDR, pon, sizeof(on)) < 0) { - RAY_LOG(ERROR) << "setsockopt failed for port " << port; - close(socket_fd); - return -1; - } - if (bind(socket_fd, (struct sockaddr *) &name, sizeof(name)) < 0) { - RAY_LOG(ERROR) << "Bind failed for port " << port; - close(socket_fd); - return -1; - } - if (shall_listen && listen(socket_fd, 128) == -1) { - RAY_LOG(ERROR) << "Could not listen to socket " << port; - close(socket_fd); - return -1; - } - return socket_fd; -} - -int bind_ipc_sock(const char *socket_pathname, bool shall_listen) { - struct sockaddr_un socket_address; - int socket_fd = socket(AF_UNIX, SOCK_STREAM, 0); - if (socket_fd < 0) { - RAY_LOG(ERROR) << "socket() failed for pathname " << socket_pathname; - return -1; - } - /* Tell the system to allow the port to be reused. 
*/ - int on = 1; - if (setsockopt(socket_fd, SOL_SOCKET, SO_REUSEADDR, (char *) &on, - sizeof(on)) < 0) { - RAY_LOG(ERROR) << "setsockopt failed for pathname " << socket_pathname; - close(socket_fd); - return -1; - } - - unlink(socket_pathname); - memset(&socket_address, 0, sizeof(socket_address)); - socket_address.sun_family = AF_UNIX; - if (strlen(socket_pathname) + 1 > sizeof(socket_address.sun_path)) { - RAY_LOG(ERROR) << "Socket pathname is too long."; - close(socket_fd); - return -1; - } - strncpy(socket_address.sun_path, socket_pathname, - strlen(socket_pathname) + 1); - - if (bind(socket_fd, (struct sockaddr *) &socket_address, - sizeof(socket_address)) != 0) { - RAY_LOG(ERROR) << "Bind failed for pathname " << socket_pathname; - close(socket_fd); - return -1; - } - if (shall_listen && listen(socket_fd, 128) == -1) { - RAY_LOG(ERROR) << "Could not listen to socket " << socket_pathname; - close(socket_fd); - return -1; - } - return socket_fd; -} - -int connect_ipc_sock_retry(const char *socket_pathname, - int num_retries, - int64_t timeout) { - /* Pick the default values if the user did not specify. */ - if (num_retries < 0) { - num_retries = RayConfig::instance().num_connect_attempts(); - } - if (timeout < 0) { - timeout = RayConfig::instance().connect_timeout_milliseconds(); - } - - RAY_CHECK(socket_pathname); - int fd = -1; - for (int num_attempts = 0; num_attempts < num_retries; ++num_attempts) { - fd = connect_ipc_sock(socket_pathname); - if (fd >= 0) { - break; - } - if (num_attempts == 0) { - RAY_LOG(ERROR) << "Connection to socket failed for pathname " - << socket_pathname; - } - /* Sleep for timeout milliseconds. */ - usleep(timeout * 1000); - } - /* If we could not connect to the socket, exit. */ - if (fd == -1) { - RAY_LOG(FATAL) << "Could not connect to socket " << socket_pathname; - } - return fd; -} - -int connect_ipc_sock(const char *socket_pathname) { - struct sockaddr_un socket_address; - int socket_fd; - - socket_fd = socket(AF_UNIX, SOCK_STREAM, 0); - if (socket_fd < 0) { - RAY_LOG(ERROR) << "socket() failed for pathname " << socket_pathname; - return -1; - } - - memset(&socket_address, 0, sizeof(socket_address)); - socket_address.sun_family = AF_UNIX; - if (strlen(socket_pathname) + 1 > sizeof(socket_address.sun_path)) { - RAY_LOG(ERROR) << "Socket pathname is too long."; - return -1; - } - strncpy(socket_address.sun_path, socket_pathname, - strlen(socket_pathname) + 1); - - if (connect(socket_fd, (struct sockaddr *) &socket_address, - sizeof(socket_address)) != 0) { - close(socket_fd); - return -1; - } - - return socket_fd; -} - -int connect_inet_sock_retry(const char *ip_addr, - int port, - int num_retries, - int64_t timeout) { - /* Pick the default values if the user did not specify. */ - if (num_retries < 0) { - num_retries = RayConfig::instance().num_connect_attempts(); - } - if (timeout < 0) { - timeout = RayConfig::instance().connect_timeout_milliseconds(); - } - - RAY_CHECK(ip_addr); - int fd = -1; - for (int num_attempts = 0; num_attempts < num_retries; ++num_attempts) { - fd = connect_inet_sock(ip_addr, port); - if (fd >= 0) { - break; - } - if (num_attempts == 0) { - RAY_LOG(ERROR) << "Connection to socket failed for address " << ip_addr - << ":" << port; - } - /* Sleep for timeout milliseconds. */ - usleep(timeout * 1000); - } - /* If we could not connect to the socket, exit. 
*/ - if (fd == -1) { - RAY_LOG(FATAL) << "Could not connect to address " << ip_addr << ":" << port; - } - return fd; -} - -int connect_inet_sock(const char *ip_addr, int port) { - int fd = socket(PF_INET, SOCK_STREAM, 0); - if (fd < 0) { - RAY_LOG(ERROR) << "socket() failed for address " << ip_addr << ":" << port; - return -1; - } - - struct hostent *manager = gethostbyname(ip_addr); /* TODO(pcm): cache this */ - if (!manager) { - RAY_LOG(ERROR) << "Failed to get hostname from address " << ip_addr << ":" - << port; - close(fd); - return -1; - } - - struct sockaddr_in addr; - addr.sin_family = AF_INET; - memcpy(&addr.sin_addr.s_addr, manager->h_addr_list[0], manager->h_length); - addr.sin_port = htons(port); - - if (connect(fd, (struct sockaddr *) &addr, sizeof(addr)) != 0) { - close(fd); - return -1; - } - return fd; -} - -int accept_client(int socket_fd) { - int client_fd = accept(socket_fd, NULL, NULL); - if (client_fd < 0) { - RAY_LOG(ERROR) << "Error reading from socket."; - return -1; - } - return client_fd; -} - -int write_bytes(int fd, uint8_t *cursor, size_t length) { - ssize_t nbytes = 0; - size_t bytesleft = length; - size_t offset = 0; - while (bytesleft > 0) { - /* While we haven't written the whole message, write to the file - * descriptor, advance the cursor, and decrease the amount left to write. */ - nbytes = write(fd, cursor + offset, bytesleft); - if (nbytes < 0) { - if (errno == EAGAIN || errno == EWOULDBLOCK || errno == EINTR) { - continue; - } - return -1; /* Errno will be set. */ - } else if (0 == nbytes) { - /* Encountered early EOF. */ - return -1; - } - RAY_CHECK(nbytes > 0); - bytesleft -= nbytes; - offset += nbytes; - } - - return 0; -} - -int do_write_message(int fd, int64_t type, int64_t length, uint8_t *bytes) { - int64_t version = RayConfig::instance().ray_protocol_version(); - int closed; - closed = write_bytes(fd, (uint8_t *) &version, sizeof(version)); - if (closed) { - return closed; - } - closed = write_bytes(fd, (uint8_t *) &type, sizeof(type)); - if (closed) { - return closed; - } - closed = write_bytes(fd, (uint8_t *) &length, sizeof(length)); - if (closed) { - return closed; - } - closed = write_bytes(fd, bytes, length * sizeof(char)); - if (closed) { - return closed; - } - return 0; -} - -int write_message(int fd, - int64_t type, - int64_t length, - uint8_t *bytes, - std::mutex *mutex) { - if (mutex != NULL) { - std::unique_lock guard(*mutex); - return do_write_message(fd, type, length, bytes); - } else { - return do_write_message(fd, type, length, bytes); - } -} - -int read_bytes(int fd, uint8_t *cursor, size_t length) { - ssize_t nbytes = 0; - /* Termination condition: EOF or read 'length' bytes total. */ - size_t bytesleft = length; - size_t offset = 0; - while (bytesleft > 0) { - nbytes = read(fd, cursor + offset, bytesleft); - if (nbytes < 0) { - if (errno == EAGAIN || errno == EWOULDBLOCK || errno == EINTR) { - continue; - } - return -1; /* Errno will be set. */ - } else if (0 == nbytes) { - /* Encountered early EOF. 
*/ - return -1; - } - RAY_CHECK(nbytes > 0); - bytesleft -= nbytes; - offset += nbytes; - } - - return 0; -} - -void read_message(int fd, int64_t *type, int64_t *length, uint8_t **bytes) { - int64_t version; - int closed = read_bytes(fd, (uint8_t *) &version, sizeof(version)); - if (closed) { - goto disconnected; - } - RAY_CHECK(version == RayConfig::instance().ray_protocol_version()); - closed = read_bytes(fd, (uint8_t *) type, sizeof(*type)); - if (closed) { - goto disconnected; - } - closed = read_bytes(fd, (uint8_t *) length, sizeof(*length)); - if (closed) { - goto disconnected; - } - *bytes = (uint8_t *) malloc(*length * sizeof(uint8_t)); - closed = read_bytes(fd, *bytes, *length); - if (closed) { - free(*bytes); - goto disconnected; - } - return; - -disconnected: - /* Handle the case in which the socket is closed. */ - *type = static_cast(CommonMessageType::DISCONNECT_CLIENT); - *length = 0; - *bytes = NULL; - return; -} - -uint8_t *read_message_async(event_loop *loop, int sock) { - int64_t size; - int error = read_bytes(sock, (uint8_t *) &size, sizeof(int64_t)); - if (error < 0) { - /* The other side has closed the socket. */ - RAY_LOG(DEBUG) << "Socket has been closed, or some other error has " - << "occurred."; - if (loop != NULL) { - event_loop_remove_file(loop, sock); - } - close(sock); - return NULL; - } - uint8_t *message = (uint8_t *) malloc(size); - error = read_bytes(sock, message, size); - if (error < 0) { - /* The other side has closed the socket. */ - RAY_LOG(DEBUG) << "Socket has been closed, or some other error has " - << "occurred."; - if (loop != NULL) { - event_loop_remove_file(loop, sock); - } - close(sock); - return NULL; - } - return message; -} - -int64_t read_vector(int fd, int64_t *type, std::vector &buffer) { - int64_t version; - int closed = read_bytes(fd, (uint8_t *) &version, sizeof(version)); - if (closed) { - goto disconnected; - } - RAY_CHECK(version == RayConfig::instance().ray_protocol_version()); - int64_t length; - closed = read_bytes(fd, (uint8_t *) type, sizeof(*type)); - if (closed) { - goto disconnected; - } - closed = read_bytes(fd, (uint8_t *) &length, sizeof(length)); - if (closed) { - goto disconnected; - } - if (static_cast(length) > buffer.size()) { - buffer.resize(length); - } - closed = read_bytes(fd, buffer.data(), length); - if (closed) { - goto disconnected; - } - return length; -disconnected: - /* Handle the case in which the socket is closed. */ - *type = static_cast(CommonMessageType::DISCONNECT_CLIENT); - return 0; -} - -void write_log_message(int fd, const char *message) { - /* Account for the \0 at the end of the string. */ - do_write_message(fd, static_cast(CommonMessageType::LOG_MESSAGE), - strlen(message) + 1, (uint8_t *) message); -} - -char *read_log_message(int fd) { - uint8_t *bytes; - int64_t type; - int64_t length; - read_message(fd, &type, &length, &bytes); - RAY_CHECK(static_cast(type) == - CommonMessageType::LOG_MESSAGE); - return (char *) bytes; -} diff --git a/src/common/io.h b/src/common/io.h deleted file mode 100644 index 3f976445aeb05..0000000000000 --- a/src/common/io.h +++ /dev/null @@ -1,228 +0,0 @@ -#ifndef IO_H -#define IO_H - -#include -#include - -#include -#include - -struct aeEventLoop; -typedef aeEventLoop event_loop; - -enum class CommonMessageType : int32_t { - /** Disconnect a client. */ - DISCONNECT_CLIENT, - /** Log a message from a client. */ - LOG_MESSAGE, - /** Submit a task to the local scheduler. */ - SUBMIT_TASK, -}; - -/* Helper functions for socket communication. 
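The write_message/read_message pair declared below frames every message as three raw int64_t fields written back to back in host byte order (protocol version, message type, payload length), followed by the payload bytes; read_message allocates the payload buffer for the caller.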
*/ - -/** - * Binds to an Internet socket at the given port. Removes any existing file at - * the pathname. Returns a non-blocking file descriptor for the socket, or -1 - * if an error occurred. - * - * @note Since the returned file descriptor is non-blocking, it is not - * recommended to use the Linux read and write calls directly, since these - * might read or write a partial message. Instead, use the provided - * write_message and read_message methods. - * - * @param port The port to bind to. - * @param shall_listen Are we also starting to listen on the socket? - * @return A non-blocking file descriptor for the socket, or -1 if an error - * occurs. - */ -int bind_inet_sock(const int port, bool shall_listen); - -/** - * Binds to a Unix domain streaming socket at the given - * pathname. Removes any existing file at the pathname. - * - * @param socket_pathname The pathname for the socket. - * @param shall_listen Are we also starting to listen on the socket? - * @return A blocking file descriptor for the socket, or -1 if an error - * occurs. - */ -int bind_ipc_sock(const char *socket_pathname, bool shall_listen); - -/** - * Connect to a Unix domain streaming socket at the given - * pathname. - * - * @param socket_pathname The pathname for the socket. - * @return A file descriptor for the socket, or -1 if an error occurred. - */ -int connect_ipc_sock(const char *socket_pathname); - -/** - * Connect to a Unix domain streaming socket at the given - * pathname, or fail after some number of retries. - * - * @param socket_pathname The pathname for the socket. - * @param num_retries The number of times to retry the connection - * before exiting. If -1 is provided, then this defaults to - * num_connect_attempts. - * @param timeout The number of milliseconds to wait in between - * retries. If -1 is provided, then this defaults to - * connect_timeout_milliseconds. - * @return A file descriptor for the socket, or -1 if an error occurred. - */ -int connect_ipc_sock_retry(const char *socket_pathname, - int num_retries, - int64_t timeout); - -/** - * Connect to an Internet socket at the given address and port. - * - * @param ip_addr The IP address to connect to. - * @param port The port number to connect to. - * - * @param socket_pathname The pathname for the socket. - * @return A file descriptor for the socket, or -1 if an error occurred. - */ -int connect_inet_sock(const char *ip_addr, int port); - -/** - * Connect to an Internet socket at the given address and port, or fail after - * some number of retries. - * - * @param ip_addr The IP address to connect to. - * @param port The port number to connect to. - * @param num_retries The number of times to retry the connection - * before exiting. If -1 is provided, then this defaults to - * num_connect_attempts. - * @param timeout The number of milliseconds to wait in between - * retries. If -1 is provided, then this defaults to - * connect_timeout_milliseconds. - * @return A file descriptor for the socket, or -1 if an error occurred. - */ -int connect_inet_sock_retry(const char *ip_addr, - int port, - int num_retries, - int64_t timeout); - -/** - * Accept a new client connection on the given socket - * descriptor. Returns a descriptor for the new socket. - */ -int accept_client(int socket_fd); - -/* Reading and writing data. */ - -/** - * Write a sequence of bytes on a file descriptor. The bytes should then be read - * by read_message. - * - * @param fd The file descriptor to write to. It can be non-blocking. - * @param version The protocol version. 
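 * (Note: the caller does not pass the version explicitly; write_message fills in RayConfig::instance().ray_protocol_version() itself, and read_message verifies it on receipt.)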
- * @param type The type of the message to send. - * @param length The size in bytes of the bytes parameter. - * @param bytes The address of the message to send. - * @param mutex If not NULL, the whole write operation will be locked - * with this mutex, otherwise do nothing. - * @return int Whether there was an error while writing. 0 corresponds to - * success and -1 corresponds to an error (errno will be set). - */ -int write_message(int fd, - int64_t type, - int64_t length, - uint8_t *bytes, - std::mutex *mutex = NULL); - -/** - * Read a sequence of bytes written by write_message from a file descriptor. - * This allocates space for the message. - * - * @note The caller must free the memory. - * - * @param fd The file descriptor to read from. It can be non-blocking. - * @param type The type of the message that is read will be written at this - * address. If there was an error while reading, this will be - * DISCONNECT_CLIENT. - * @param length The size in bytes of the message that is read will be written - * at this address. This size does not include the bytes used to encode - * the type and length. If there was an error while reading, this will - * be 0. - * @param bytes The address at which to write the pointer to the bytes that are - * read and allocated by this function. If there was an error while - * reading, this will be NULL. - * @return Void. - */ -void read_message(int fd, int64_t *type, int64_t *length, uint8_t **bytes); - -/** - * Read a message from a file descriptor and remove the file descriptor from the - * event loop if there is an error. This will actually do two reads. The first - * read reads sizeof(int64_t) bytes to determine the number of bytes to read in - * the next read. - * - * @param loop: The event loop. - * @param sock: The file descriptor to read from. - * @return A byte buffer contining the message or NULL if there was an - * error. The buffer needs to be freed by the user. - */ -uint8_t *read_message_async(event_loop *loop, int sock); - -/** - * Read a sequence of bytes written by write_message from a file descriptor. - * This does not allocate space for the message if the provided buffer is - * large enough and can therefore often avoid allocations. - * - * @param fd The file descriptor to read from. It can be non-blocking. - * @param type The type of the message that is read will be written at this - * address. If there was an error while reading, this will be - * DISCONNECT_CLIENT. - * @param buffer The array the message will be written to. If it is not - * large enough to hold the message, it will be enlarged by read_vector. - * @return Number of bytes of the message that were read. This size does not - * include the bytes used to encode the type and length. If there was - * an error while reading, this will be 0. - */ -int64_t read_vector(int fd, int64_t *type, std::vector &buffer); - -/** - * Write a null-terminated string to a file descriptor. - */ -void write_log_message(int fd, const char *message); - -/** - * Reads a null-terminated string from the file descriptor that has been - * written by write_log_message. Allocates and returns a pointer to the string. - * NOTE: Caller must free the memory! - */ -char *read_log_message(int fd); - -/** - * Read a sequence of bytes from a file descriptor into a buffer. This will - * block until one of the following happens: (1) there is an error (2) end of - * file, or (3) all length bytes have been written. 
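A minimal usage sketch of the framing helpers declared above, not taken from the original tree: it assumes the declarations in this header are linked against the io.cc implementation deleted above, default RayConfig settings, and an include path under which "io.h" resolves.

#include <sys/socket.h>

#include <cstdlib>

#include "io.h"

int main() {
  int fds[2];
  if (socketpair(AF_UNIX, SOCK_STREAM, 0, fds) != 0) {
    return 1;
  }
  const char payload[] = "hello";
  // write_message prepends the protocol version, the message type, and the
  // payload length before the payload bytes.
  write_message(fds[0], static_cast<int64_t>(CommonMessageType::LOG_MESSAGE),
                sizeof(payload), (uint8_t *) payload);
  // read_message allocates the payload buffer; the caller must free it.
  int64_t type = 0;
  int64_t length = 0;
  uint8_t *bytes = NULL;
  read_message(fds[1], &type, &length, &bytes);
  free(bytes);
  return 0;
}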
- * - * @note The buffer pointed to by cursor must already have length number of - * bytes allocated before calling this method. - * - * @param fd The file descriptor to read from. It can be non-blocking. - * @param cursor The cursor pointing to the beginning of the buffer. - * @param length The size of the byte sequence to read. - * @return int Whether there was an error while reading. 0 corresponds to - * success and -1 corresponds to an error (errno will be set). - */ -int read_bytes(int fd, uint8_t *cursor, size_t length); - -/** - * Write a sequence of bytes into a file descriptor. This will block until one - * of the following happens: (1) there is an error (2) end of file, or (3) all - * length bytes have been written. - * - * @param fd The file descriptor to write to. It can be non-blocking. - * @param cursor The cursor pointing to the beginning of the bytes to send. - * @param length The size of the bytes sequence to write. - * @return int Whether there was an error while writing. 0 corresponds to - * success and -1 corresponds to an error (errno will be set). - */ -int write_bytes(int fd, uint8_t *cursor, size_t length); - -#endif /* IO_H */ diff --git a/src/common/lib/python/common_extension.cc b/src/common/lib/python/common_extension.cc deleted file mode 100644 index 68965e270980c..0000000000000 --- a/src/common/lib/python/common_extension.cc +++ /dev/null @@ -1,919 +0,0 @@ -#include -#include "bytesobject.h" -#include "node.h" - -// Don't use the deprecated Numpy functions. -#define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION - -#include - -#include "common.h" -#include "common_extension.h" -#include "common_protocol.h" -#include "ray/raylet/task.h" -#include "ray/raylet/task_spec.h" -#include "ray/raylet/task_execution_spec.h" -#include "task.h" - -#include - -#if PY_MAJOR_VERSION >= 3 -#define PyInt_Check PyLong_Check -#endif - -PyObject *CommonError; - -/* Initialize pickle module. */ - -PyObject *pickle_module = NULL; -PyObject *pickle_loads = NULL; -PyObject *pickle_dumps = NULL; -PyObject *pickle_protocol = NULL; - -int init_numpy_module(void) { - import_array1(-1); - return 0; -} - -void init_pickle_module(void) { -#if PY_MAJOR_VERSION >= 3 - pickle_module = PyImport_ImportModule("pickle"); -#else - pickle_module = PyImport_ImportModuleNoBlock("cPickle"); -#endif - RAY_CHECK(pickle_module != NULL); - RAY_CHECK(PyObject_HasAttrString(pickle_module, "loads")); - RAY_CHECK(PyObject_HasAttrString(pickle_module, "dumps")); - RAY_CHECK(PyObject_HasAttrString(pickle_module, "HIGHEST_PROTOCOL")); - pickle_loads = PyUnicode_FromString("loads"); - pickle_dumps = PyUnicode_FromString("dumps"); - pickle_protocol = PyObject_GetAttrString(pickle_module, "HIGHEST_PROTOCOL"); - RAY_CHECK(pickle_protocol != NULL); -} - -TaskBuilder *g_task_builder = NULL; - -/* Define the PyObjectID class. 
*/ - -int PyStringToUniqueID(PyObject *object, ObjectID *object_id) { - if (PyBytes_Check(object)) { - std::memcpy(object_id->mutable_data(), PyBytes_AsString(object), - sizeof(*object_id)); - return 1; - } else { - PyErr_SetString(PyExc_TypeError, "must be a 20 character string"); - return 0; - } -} - -int PyObjectToUniqueID(PyObject *object, ObjectID *objectid) { - if (PyObject_IsInstance(object, (PyObject *) &PyObjectIDType)) { - *objectid = ((PyObjectID *) object)->object_id; - return 1; - } else { - PyErr_SetString(PyExc_TypeError, "must be an ObjectID"); - return 0; - } -} - -bool use_raylet(PyTask *task) { - return task->spec == nullptr; -} - -static int PyObjectID_init(PyObjectID *self, PyObject *args, PyObject *kwds) { - const char *data; - int size; - if (!PyArg_ParseTuple(args, "s#", &data, &size)) { - return -1; - } - if (size != sizeof(ObjectID)) { - PyErr_SetString(CommonError, - "ObjectID: object id string needs to have length 20"); - return -1; - } - std::memcpy(self->object_id.mutable_data(), data, sizeof(self->object_id)); - return 0; -} - -/* Create a PyObjectID from C. */ -PyObject *PyObjectID_make(ObjectID object_id) { - PyObjectID *result = PyObject_New(PyObjectID, &PyObjectIDType); - result = (PyObjectID *) PyObject_Init((PyObject *) result, &PyObjectIDType); - result->object_id = object_id; - return (PyObject *) result; -} - -/** - * Convert a string to a Ray task specification Python object. - * - * This is called from Python like - * - * task = local_scheduler.task_from_string("...") - * - * @param task_string String representation of the task specification. - * @return Python task specification object. - */ -PyObject *PyTask_from_string(PyObject *self, PyObject *args) { - const char *data; - int size; - if (!PyArg_ParseTuple(args, "s#", &data, &size)) { - return NULL; - } - PyTask *result = PyObject_New(PyTask, &PyTaskType); - result = (PyTask *) PyObject_Init((PyObject *) result, &PyTaskType); - result->size = size; - result->spec = TaskSpec_copy((TaskSpec *) data, size); - /* The created task does not include any execution dependencies. */ - result->execution_dependencies = new std::vector(); - /* TODO(pcm): Use flatbuffers validation here. */ - return (PyObject *) result; -} - -/** - * Convert a Ray task specification Python object to a string. - * - * This is called from Python like - * - * s = local_scheduler.task_to_string(task) - * - * @param task Ray task specification Python object. - * @return String representing the task specification. 
- */ -PyObject *PyTask_to_string(PyObject *self, PyObject *args) { - PyObject *arg; - if (!PyArg_ParseTuple(args, "O", &arg)) { - return NULL; - } - PyTask *task = (PyTask *) arg; - if (!use_raylet(task)) { - return PyBytes_FromStringAndSize((char *) task->spec, task->size); - } else { - flatbuffers::FlatBufferBuilder fbb; - auto task_spec_string = task->task_spec->ToFlatbuffer(fbb); - fbb.Finish(task_spec_string); - return PyBytes_FromStringAndSize((char *) fbb.GetBufferPointer(), - fbb.GetSize()); - } -} - -static PyObject *PyObjectID_id(PyObject *self) { - PyObjectID *s = (PyObjectID *) self; - return PyBytes_FromStringAndSize((const char *) s->object_id.data(), - sizeof(s->object_id)); -} - -static PyObject *PyObjectID_hex(PyObject *self) { - PyObjectID *s = (PyObjectID *) self; - std::string hex_id = s->object_id.hex(); -#if PY_MAJOR_VERSION >= 3 - PyObject *result = PyUnicode_FromStringAndSize(hex_id.data(), hex_id.size()); -#else - PyObject *result = PyBytes_FromStringAndSize(hex_id.data(), hex_id.size()); -#endif - return result; -} - -static PyObject *PyObjectID_richcompare(PyObjectID *self, - PyObject *other, - int op) { - PyObject *result = NULL; - if (Py_TYPE(self)->tp_richcompare != Py_TYPE(other)->tp_richcompare) { - result = Py_NotImplemented; - } else { - PyObjectID *other_id = (PyObjectID *) other; - switch (op) { - case Py_LT: - result = Py_NotImplemented; - break; - case Py_LE: - result = Py_NotImplemented; - break; - case Py_EQ: - result = self->object_id == other_id->object_id ? Py_True : Py_False; - break; - case Py_NE: - result = !(self->object_id == other_id->object_id) ? Py_True : Py_False; - break; - case Py_GT: - result = Py_NotImplemented; - break; - case Py_GE: - result = Py_NotImplemented; - break; - } - } - Py_XINCREF(result); - return result; -} - -static PyObject *PyObjectID_redis_shard_hash(PyObjectID *self) { - /* NOTE: The hash function used here must match the one in get_redis_context - * in src/common/state/redis.cc. Changes to the hash function should only be - * made through std::hash in src/common/common.h */ - std::hash hash; - return PyLong_FromSize_t(hash(self->object_id)); -} - -static long PyObjectID_hash(PyObjectID *self) { - // TODO(pcm): Replace this with a faster hash function. This currently - // creates a tuple of length 20 and hashes it, which is slow - PyObject *tuple = PyTuple_New(kUniqueIDSize); - for (int i = 0; i < kUniqueIDSize; ++i) { - PyTuple_SetItem(tuple, i, PyLong_FromLong(self->object_id.data()[i])); - } - long hash = PyObject_Hash(tuple); - Py_XDECREF(tuple); - return hash; -} - -static PyObject *PyObjectID_repr(PyObjectID *self) { - std::string repr = "ObjectID(" + self->object_id.hex() + ")"; - PyObject *result = PyUnicode_FromString(repr.c_str()); - return result; -} - -static PyObject *PyObjectID___reduce__(PyObjectID *self) { - PyErr_SetString(CommonError, "ObjectID objects cannot be serialized."); - return NULL; -} - -static PyMethodDef PyObjectID_methods[] = { - {"id", (PyCFunction) PyObjectID_id, METH_NOARGS, - "Return the hash associated with this ObjectID"}, - {"redis_shard_hash", (PyCFunction) PyObjectID_redis_shard_hash, METH_NOARGS, - "Return the redis shard that this ObjectID is associated with"}, - {"hex", (PyCFunction) PyObjectID_hex, METH_NOARGS, - "Return the object ID as a string in hex."}, - {"__reduce__", (PyCFunction) PyObjectID___reduce__, METH_NOARGS, - "Say how to pickle this ObjectID. 
This raises an exception to prevent" - "object IDs from being serialized."}, - {NULL} /* Sentinel */ -}; - -static PyMemberDef PyObjectID_members[] = { - {NULL} /* Sentinel */ -}; - -PyTypeObject PyObjectIDType = { - PyVarObject_HEAD_INIT(NULL, 0) /* ob_size */ - "common.ObjectID", /* tp_name */ - sizeof(PyObjectID), /* tp_basicsize */ - 0, /* tp_itemsize */ - 0, /* tp_dealloc */ - 0, /* tp_print */ - 0, /* tp_getattr */ - 0, /* tp_setattr */ - 0, /* tp_compare */ - (reprfunc) PyObjectID_repr, /* tp_repr */ - 0, /* tp_as_number */ - 0, /* tp_as_sequence */ - 0, /* tp_as_mapping */ - (hashfunc) PyObjectID_hash, /* tp_hash */ - 0, /* tp_call */ - 0, /* tp_str */ - 0, /* tp_getattro */ - 0, /* tp_setattro */ - 0, /* tp_as_buffer */ - Py_TPFLAGS_DEFAULT, /* tp_flags */ - "ObjectID object", /* tp_doc */ - 0, /* tp_traverse */ - 0, /* tp_clear */ - (richcmpfunc) PyObjectID_richcompare, /* tp_richcompare */ - 0, /* tp_weaklistoffset */ - 0, /* tp_iter */ - 0, /* tp_iternext */ - PyObjectID_methods, /* tp_methods */ - PyObjectID_members, /* tp_members */ - 0, /* tp_getset */ - 0, /* tp_base */ - 0, /* tp_dict */ - 0, /* tp_descr_get */ - 0, /* tp_descr_set */ - 0, /* tp_dictoffset */ - (initproc) PyObjectID_init, /* tp_init */ - 0, /* tp_alloc */ - PyType_GenericNew, /* tp_new */ -}; - -/* Define the PyTask class. */ - -static int PyTask_init(PyTask *self, PyObject *args, PyObject *kwds) { - /* ID of the driver that this task originates from. */ - UniqueID driver_id; - /* ID of the actor this task should run on. */ - UniqueID actor_id = ActorID::nil(); - /* ID of the actor handle used to submit this task. */ - UniqueID actor_handle_id = ActorHandleID::nil(); - /* How many tasks have been launched on the actor so far? */ - int actor_counter = 0; - /* True if this is an actor checkpoint task and false otherwise. */ - PyObject *is_actor_checkpoint_method_object = nullptr; - /* ID of the function this task executes. */ - FunctionID function_id; - /* Arguments of the task (can be PyObjectIDs or Python values). */ - PyObject *arguments; - /* Number of return values of this task. */ - int num_returns; - /* The ID of the task that called this task. */ - TaskID parent_task_id; - /* The number of tasks that the parent task has called prior to this one. */ - int parent_counter; - // The actor creation ID. - ActorID actor_creation_id = ActorID::nil(); - // The dummy object for the actor creation task (if this is an actor method). - ObjectID actor_creation_dummy_object_id = ObjectID::nil(); - /* Arguments of the task that are execution-dependent. These must be - * PyObjectIDs). */ - PyObject *execution_arguments = nullptr; - /* Dictionary of resource requirements for this task. */ - PyObject *resource_map = nullptr; - // True if we should use the raylet code path and false otherwise. 
- PyObject *use_raylet_object = nullptr; - if (!PyArg_ParseTuple( - args, "O&O&OiO&i|O&O&O&O&iOOOO", &PyObjectToUniqueID, &driver_id, - &PyObjectToUniqueID, &function_id, &arguments, &num_returns, - &PyObjectToUniqueID, &parent_task_id, &parent_counter, - &PyObjectToUniqueID, &actor_creation_id, &PyObjectToUniqueID, - &actor_creation_dummy_object_id, &PyObjectToUniqueID, &actor_id, - &PyObjectToUniqueID, &actor_handle_id, &actor_counter, - &is_actor_checkpoint_method_object, &execution_arguments, - &resource_map, &use_raylet_object)) { - return -1; - } - - bool is_actor_checkpoint_method = false; - if (is_actor_checkpoint_method_object != nullptr && - PyObject_IsTrue(is_actor_checkpoint_method_object) == 1) { - is_actor_checkpoint_method = true; - } - - // Parse the resource map. - std::unordered_map required_resources; - - bool found_CPU_requirements = false; - PyObject *key, *value; - Py_ssize_t position = 0; - if (resource_map != nullptr) { - if (!PyDict_Check(resource_map)) { - PyErr_SetString(PyExc_TypeError, "resource_map must be a dictionary"); - return -1; - } - while (PyDict_Next(resource_map, &position, &key, &value)) { - if (!(PyBytes_Check(key) || PyUnicode_Check(key))) { - PyErr_SetString(PyExc_TypeError, - "the keys in resource_map must be strings"); - return -1; - } - if (!(PyFloat_Check(value) || PyInt_Check(value) || - PyLong_Check(value))) { - PyErr_SetString(PyExc_TypeError, - "the values in resource_map must be floats"); - return -1; - } - // Handle the case where the key is a bytes object and the case where it - // is a unicode object. - std::string resource_name; - if (PyUnicode_Check(key)) { - PyObject *ascii_key = PyUnicode_AsASCIIString(key); - resource_name = - std::string(PyBytes_AsString(ascii_key), PyBytes_Size(ascii_key)); - Py_DECREF(ascii_key); - } else { - resource_name = std::string(PyBytes_AsString(key), PyBytes_Size(key)); - } - if (resource_name == std::string("CPU")) { - found_CPU_requirements = true; - } - required_resources[resource_name] = PyFloat_AsDouble(value); - } - } - if (!found_CPU_requirements) { - required_resources["CPU"] = 1.0; - } - - Py_ssize_t num_args = PyList_Size(arguments); - - bool use_raylet = false; - if (use_raylet_object != nullptr && PyObject_IsTrue(use_raylet_object) == 1) { - use_raylet = true; - } - self->spec = nullptr; - self->task_spec = nullptr; - - // Create the task spec. - if (!use_raylet) { - // The non-raylet code path. - - // Construct the task specification. - TaskSpec_start_construct( - g_task_builder, driver_id, parent_task_id, parent_counter, - actor_creation_id, actor_creation_dummy_object_id, actor_id, - actor_handle_id, actor_counter, is_actor_checkpoint_method, function_id, - num_returns); - // Add the task arguments. - for (Py_ssize_t i = 0; i < num_args; ++i) { - PyObject *arg = PyList_GetItem(arguments, i); - if (PyObject_IsInstance(arg, - reinterpret_cast(&PyObjectIDType))) { - TaskSpec_args_add_ref(g_task_builder, - &(reinterpret_cast(arg))->object_id, - 1); - } else { - PyObject *data = PyObject_CallMethodObjArgs(pickle_module, pickle_dumps, - arg, pickle_protocol, NULL); - TaskSpec_args_add_val( - g_task_builder, reinterpret_cast(PyBytes_AsString(data)), - PyBytes_Size(data)); - Py_DECREF(data); - } - } - // Set the resource requirements for the task. - for (auto const &resource_pair : required_resources) { - TaskSpec_set_required_resource(g_task_builder, resource_pair.first, - resource_pair.second); - } - - // Compute the task ID and the return object IDs. 
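// (TaskSpec_finish_construct serializes the builder state into a heap-allocated TaskSpec and records its size in self->size; the PyTask owns that buffer and releases it via TaskSpec_free in PyTask_dealloc.)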
- self->spec = TaskSpec_finish_construct(g_task_builder, &self->size); - - } else { - // The raylet code path. - - // Parse the arguments from the list. - std::vector> args; - for (Py_ssize_t i = 0; i < num_args; ++i) { - PyObject *arg = PyList_GetItem(arguments, i); - if (PyObject_IsInstance(arg, - reinterpret_cast(&PyObjectIDType))) { - std::vector references = { - reinterpret_cast(arg)->object_id}; - args.push_back( - std::make_shared(references)); - } else { - PyObject *data = PyObject_CallMethodObjArgs(pickle_module, pickle_dumps, - arg, pickle_protocol, NULL); - args.push_back(std::make_shared( - reinterpret_cast(PyBytes_AsString(data)), - PyBytes_Size(data))); - Py_DECREF(data); - } - } - - self->task_spec = new ray::raylet::TaskSpecification( - driver_id, parent_task_id, parent_counter, actor_creation_id, - actor_creation_dummy_object_id, actor_id, actor_handle_id, - actor_counter, function_id, args, num_returns, required_resources, - Language::PYTHON); - } - - /* Set the task's execution dependencies. */ - self->execution_dependencies = new std::vector(); - if (execution_arguments != NULL) { - Py_ssize_t num_execution_args = PyList_Size(execution_arguments); - for (Py_ssize_t i = 0; i < num_execution_args; ++i) { - PyObject *execution_arg = PyList_GetItem(execution_arguments, i); - if (!PyObject_IsInstance(execution_arg, (PyObject *) &PyObjectIDType)) { - PyErr_SetString(PyExc_TypeError, - "Execution arguments must be an ObjectID."); - return -1; - } - self->execution_dependencies->push_back( - ((PyObjectID *) execution_arg)->object_id); - } - } - - return 0; -} - -static void PyTask_dealloc(PyTask *self) { - if (!use_raylet(self)) { - TaskSpec_free(self->spec); - } else { - delete self->task_spec; - } - delete self->execution_dependencies; - Py_TYPE(self)->tp_free(reinterpret_cast(self)); -} - -static PyObject *PyTask_function_id(PyTask *self) { - FunctionID function_id; - if (!use_raylet(self)) { - function_id = TaskSpec_function(self->spec); - } else { - function_id = self->task_spec->FunctionId(); - } - return PyObjectID_make(function_id); -} - -static PyObject *PyTask_actor_id(PyTask *self) { - ActorID actor_id; - if (!use_raylet(self)) { - actor_id = TaskSpec_actor_id(self->spec); - } else { - actor_id = self->task_spec->ActorId(); - } - return PyObjectID_make(actor_id); -} - -static PyObject *PyTask_actor_counter(PyTask *self) { - int64_t actor_counter; - if (!use_raylet(self)) { - actor_counter = TaskSpec_actor_counter(self->spec); - } else { - actor_counter = self->task_spec->ActorCounter(); - } - return PyLong_FromLongLong(actor_counter); -} - -static PyObject *PyTask_driver_id(PyTask *self) { - UniqueID driver_id; - if (!use_raylet(self)) { - driver_id = TaskSpec_driver_id(self->spec); - } else { - driver_id = self->task_spec->DriverId(); - } - return PyObjectID_make(driver_id); -} - -static PyObject *PyTask_task_id(PyTask *self) { - TaskID task_id; - if (!use_raylet(self)) { - task_id = TaskSpec_task_id(self->spec); - } else { - task_id = self->task_spec->TaskId(); - } - return PyObjectID_make(task_id); -} - -static PyObject *PyTask_parent_task_id(PyTask *self) { - TaskID task_id; - if (!use_raylet(self)) { - task_id = TaskSpec_parent_task_id(self->spec); - } else { - task_id = self->task_spec->ParentTaskId(); - } - return PyObjectID_make(task_id); -} - -static PyObject *PyTask_parent_counter(PyTask *self) { - int64_t parent_counter; - if (!use_raylet(self)) { - parent_counter = TaskSpec_parent_counter(self->spec); - } else { - parent_counter = 
self->task_spec->ParentCounter(); - } - return PyLong_FromLongLong(parent_counter); -} - -static PyObject *PyTask_arguments(PyTask *self) { - TaskSpec *task = self->spec; - ray::raylet::TaskSpecification *task_spec = self->task_spec; - - int64_t num_args; - if (!use_raylet(self)) { - num_args = TaskSpec_num_args(task); - } else { - num_args = self->task_spec->NumArgs(); - } - - PyObject *arg_list = PyList_New((Py_ssize_t) num_args); - for (int i = 0; i < num_args; ++i) { - int count; - if (!use_raylet(self)) { - count = TaskSpec_arg_id_count(task, i); - } else { - count = task_spec->ArgIdCount(i); - } - - if (count > 0) { - assert(count == 1); - - ObjectID object_id; - if (!use_raylet(self)) { - object_id = TaskSpec_arg_id(task, i, 0); - } else { - object_id = task_spec->ArgId(i, 0); - } - - PyList_SetItem(arg_list, i, PyObjectID_make(object_id)); - } else { - RAY_CHECK(pickle_module != NULL); - RAY_CHECK(pickle_loads != NULL); - - const uint8_t *arg_val; - int64_t arg_length; - if (!use_raylet(self)) { - arg_val = TaskSpec_arg_val(task, i); - arg_length = TaskSpec_arg_length(task, i); - } else { - arg_val = task_spec->ArgVal(i); - arg_length = task_spec->ArgValLength(i); - } - - PyObject *str = - PyBytes_FromStringAndSize(reinterpret_cast(arg_val), - static_cast(arg_length)); - PyObject *val = - PyObject_CallMethodObjArgs(pickle_module, pickle_loads, str, NULL); - Py_XDECREF(str); - PyList_SetItem(arg_list, i, val); - } - } - return arg_list; -} - -static PyObject *PyTask_actor_creation_id(PyTask *self) { - ActorID actor_creation_id; - if (!use_raylet(self)) { - actor_creation_id = TaskSpec_actor_creation_id(self->spec); - } else { - actor_creation_id = self->task_spec->ActorCreationId(); - } - return PyObjectID_make(actor_creation_id); -} - -static PyObject *PyTask_actor_creation_dummy_object_id(PyTask *self) { - ObjectID actor_creation_dummy_object_id; - if (!use_raylet(self)) { - if (TaskSpec_is_actor_task(self->spec)) { - actor_creation_dummy_object_id = - TaskSpec_actor_creation_dummy_object_id(self->spec); - } else { - actor_creation_dummy_object_id = ObjectID::nil(); - } - } else { - actor_creation_dummy_object_id = - self->task_spec->ActorCreationDummyObjectId(); - } - return PyObjectID_make(actor_creation_dummy_object_id); -} - -static PyObject *PyTask_required_resources(PyTask *self) { - PyObject *required_resources = PyDict_New(); - - std::unordered_map resource_map; - if (!use_raylet(self)) { - resource_map = TaskSpec_get_required_resources(self->spec); - } else { - resource_map = self->task_spec->GetRequiredResources().GetResourceMap(); - } - - for (auto const &resource_pair : resource_map) { - std::string resource_name = resource_pair.first; -#if PY_MAJOR_VERSION >= 3 - PyObject *key = - PyUnicode_FromStringAndSize(resource_name.data(), resource_name.size()); -#else - PyObject *key = - PyBytes_FromStringAndSize(resource_name.data(), resource_name.size()); -#endif - PyObject *value = PyFloat_FromDouble(resource_pair.second); - PyDict_SetItem(required_resources, key, value); - Py_DECREF(key); - Py_DECREF(value); - } - return required_resources; -} - -static PyObject *PyTask_returns(PyTask *self) { - TaskSpec *task = self->spec; - ray::raylet::TaskSpecification *task_spec = self->task_spec; - - int64_t num_returns; - if (!use_raylet(self)) { - num_returns = TaskSpec_num_returns(task); - } else { - num_returns = task_spec->NumReturns(); - } - - PyObject *return_id_list = PyList_New((Py_ssize_t) num_returns); - for (int i = 0; i < num_returns; ++i) { - ObjectID object_id; - if 
(!use_raylet(self)) { - object_id = TaskSpec_return(task, i); - } else { - object_id = task_spec->ReturnId(i); - } - PyList_SetItem(return_id_list, i, PyObjectID_make(object_id)); - } - return return_id_list; -} - -static PyObject *PyTask_execution_dependencies_string(PyTask *self) { - flatbuffers::FlatBufferBuilder fbb; - auto execution_dependencies = CreateTaskExecutionDependencies( - fbb, to_flatbuf(fbb, *self->execution_dependencies)); - fbb.Finish(execution_dependencies); - return PyBytes_FromStringAndSize((char *) fbb.GetBufferPointer(), - fbb.GetSize()); -} - -static PyObject *PyTask_to_serialized_flatbuf(PyTask *self) { - RAY_CHECK(use_raylet(self)); - - const std::vector execution_dependencies( - *self->execution_dependencies); - auto const execution_spec = ray::raylet::TaskExecutionSpecification( - std::move(execution_dependencies)); - auto const task = ray::raylet::Task(execution_spec, *self->task_spec); - - flatbuffers::FlatBufferBuilder fbb; - auto task_flatbuffer = task.ToFlatbuffer(fbb); - fbb.Finish(task_flatbuffer); - - return PyBytes_FromStringAndSize( - reinterpret_cast(fbb.GetBufferPointer()), fbb.GetSize()); -} - -static PyMethodDef PyTask_methods[] = { - {"function_id", (PyCFunction) PyTask_function_id, METH_NOARGS, - "Return the function ID for this task."}, - {"parent_task_id", (PyCFunction) PyTask_parent_task_id, METH_NOARGS, - "Return the task ID of the parent task."}, - {"parent_counter", (PyCFunction) PyTask_parent_counter, METH_NOARGS, - "Return the parent counter of this task."}, - {"actor_id", (PyCFunction) PyTask_actor_id, METH_NOARGS, - "Return the actor ID for this task."}, - {"actor_counter", (PyCFunction) PyTask_actor_counter, METH_NOARGS, - "Return the actor counter for this task."}, - {"driver_id", (PyCFunction) PyTask_driver_id, METH_NOARGS, - "Return the driver ID for this task."}, - {"task_id", (PyCFunction) PyTask_task_id, METH_NOARGS, - "Return the task ID for this task."}, - {"arguments", (PyCFunction) PyTask_arguments, METH_NOARGS, - "Return the arguments for the task."}, - {"actor_creation_id", (PyCFunction) PyTask_actor_creation_id, METH_NOARGS, - "Return the actor creation ID for the task."}, - {"actor_creation_dummy_object_id", - (PyCFunction) PyTask_actor_creation_dummy_object_id, METH_NOARGS, - "Return the actor creation dummy object ID for the task."}, - {"required_resources", (PyCFunction) PyTask_required_resources, METH_NOARGS, - "Return the resource vector of the task."}, - {"returns", (PyCFunction) PyTask_returns, METH_NOARGS, - "Return the object IDs for the return values of the task."}, - {"execution_dependencies_string", - (PyCFunction) PyTask_execution_dependencies_string, METH_NOARGS, - "Return the execution dependencies for the task as a string."}, - {"_serialized_raylet_task", (PyCFunction) PyTask_to_serialized_flatbuf, - METH_NOARGS, - "This is a hack used to create a serialized flatbuffer object for the " - "driver task. 
We're doing this because creating the flatbuffer object in " - "Python didn't seem to work."}, - {NULL} /* Sentinel */ -}; - -PyTypeObject PyTaskType = { - PyVarObject_HEAD_INIT(NULL, 0) /* ob_size */ - "task.Task", /* tp_name */ - sizeof(PyTask), /* tp_basicsize */ - 0, /* tp_itemsize */ - (destructor) PyTask_dealloc, /* tp_dealloc */ - 0, /* tp_print */ - 0, /* tp_getattr */ - 0, /* tp_setattr */ - 0, /* tp_compare */ - 0, /* tp_repr */ - 0, /* tp_as_number */ - 0, /* tp_as_sequence */ - 0, /* tp_as_mapping */ - 0, /* tp_hash */ - 0, /* tp_call */ - 0, /* tp_str */ - 0, /* tp_getattro */ - 0, /* tp_setattro */ - 0, /* tp_as_buffer */ - Py_TPFLAGS_DEFAULT, /* tp_flags */ - "Task object", /* tp_doc */ - 0, /* tp_traverse */ - 0, /* tp_clear */ - 0, /* tp_richcompare */ - 0, /* tp_weaklistoffset */ - 0, /* tp_iter */ - 0, /* tp_iternext */ - PyTask_methods, /* tp_methods */ - 0, /* tp_members */ - 0, /* tp_getset */ - 0, /* tp_base */ - 0, /* tp_dict */ - 0, /* tp_descr_get */ - 0, /* tp_descr_set */ - 0, /* tp_dictoffset */ - (initproc) PyTask_init, /* tp_init */ - 0, /* tp_alloc */ - PyType_GenericNew, /* tp_new */ -}; - -/* Create a PyTask from a C struct. The resulting PyTask takes ownership of the - * TaskSpec and will deallocate the TaskSpec in the PyTask destructor. */ -PyObject *PyTask_make(TaskSpec *task_spec, int64_t task_size) { - PyTask *result = PyObject_New(PyTask, &PyTaskType); - result = (PyTask *) PyObject_Init((PyObject *) result, &PyTaskType); - result->spec = task_spec; - result->size = task_size; - /* The created task does not include any execution dependencies. */ - result->execution_dependencies = new std::vector(); - return (PyObject *) result; -} - -/* Define the methods for the module. */ - -/** - * This method checks if a Python object is sufficiently simple that it can be - * serialized and passed by value as an argument to a task (without being put in - * the object store). The details of which objects are sufficiently simple are - * defined by this method and are not particularly important. But for - * performance reasons, it is better to place "small" objects in the task itself - * and "large" objects in the object store. - * - * @param value The Python object in question. - * @param num_elements_contained If this method returns 1, then the number of - * objects recursively contained within this object will be added to the - * value at this address. This is used to make sure that we do not - * serialize objects that are too large. - * @return False if the object cannot be serialized in the task and true if it - * can. 
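 * (In effect this is a conservative recursive size estimate, cut off by RayConfig's num_elements_limit and size_limit, as implemented below.)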
- */ -bool is_simple_value(PyObject *value, int *num_elements_contained) { - *num_elements_contained += 1; - if (*num_elements_contained >= RayConfig::instance().num_elements_limit()) { - return false; - } - if (PyInt_Check(value) || PyLong_Check(value) || value == Py_False || - value == Py_True || PyFloat_Check(value) || value == Py_None) { - return true; - } - if (PyBytes_CheckExact(value)) { - *num_elements_contained += PyBytes_Size(value); - return (*num_elements_contained < - RayConfig::instance().num_elements_limit()); - } - if (PyUnicode_CheckExact(value)) { - *num_elements_contained += PyUnicode_GET_SIZE(value); - return (*num_elements_contained < - RayConfig::instance().num_elements_limit()); - } - if (PyList_CheckExact(value) && - PyList_Size(value) < RayConfig::instance().size_limit()) { - for (Py_ssize_t i = 0; i < PyList_Size(value); ++i) { - if (!is_simple_value(PyList_GetItem(value, i), num_elements_contained)) { - return false; - } - } - return (*num_elements_contained < - RayConfig::instance().num_elements_limit()); - } - if (PyDict_CheckExact(value) && - PyDict_Size(value) < RayConfig::instance().size_limit()) { - PyObject *key, *val; - Py_ssize_t pos = 0; - while (PyDict_Next(value, &pos, &key, &val)) { - if (!is_simple_value(key, num_elements_contained) || - !is_simple_value(val, num_elements_contained)) { - return false; - } - } - return (*num_elements_contained < - RayConfig::instance().num_elements_limit()); - } - if (PyTuple_CheckExact(value) && - PyTuple_Size(value) < RayConfig::instance().size_limit()) { - for (Py_ssize_t i = 0; i < PyTuple_Size(value); ++i) { - if (!is_simple_value(PyTuple_GetItem(value, i), num_elements_contained)) { - return false; - } - } - return (*num_elements_contained < - RayConfig::instance().num_elements_limit()); - } - if (PyArray_CheckExact(value)) { - PyArrayObject *array = reinterpret_cast(value); - if (PyArray_TYPE(array) == NPY_OBJECT) { - return false; - } - *num_elements_contained += PyArray_NBYTES(array); - return (*num_elements_contained < - RayConfig::instance().num_elements_limit()); - } - return false; -} - -PyObject *check_simple_value(PyObject *self, PyObject *args) { - PyObject *value; - if (!PyArg_ParseTuple(args, "O", &value)) { - return NULL; - } - int num_elements_contained = 0; - if (is_simple_value(value, &num_elements_contained)) { - Py_RETURN_TRUE; - } - Py_RETURN_FALSE; -} - -PyObject *compute_task_id(PyObject *self, PyObject *args) { - ObjectID object_id; - if (!PyArg_ParseTuple(args, "O&", &PyObjectToUniqueID, &object_id)) { - return NULL; - } - TaskID task_id = ray::ComputeTaskId(object_id); - return PyObjectID_make(task_id); -} diff --git a/src/common/logging.cc b/src/common/logging.cc deleted file mode 100644 index 9802dd3d03f3a..0000000000000 --- a/src/common/logging.cc +++ /dev/null @@ -1,107 +0,0 @@ -#include "logging.h" - -#include -#include -#include - -#include - -#include "state/redis.h" -#include "io.h" -#include -#include - -static const char *log_levels[5] = {"DEBUG", "INFO", "WARN", "ERROR", "FATAL"}; -static const char *log_fmt = - "HMSET log:%s:%s log_level %s event_type %s message %s timestamp %s"; - -struct RayLoggerImpl { - /* String that identifies this client type. */ - const char *client_type; - /* Suppress all log messages below this level. */ - int log_level; - /* Whether or not we have a direct connection to Redis. */ - int is_direct; - /* Either a db_handle or a socket to a process with a db_handle, - * depending on the is_direct flag. 
*/ - void *conn; -}; - -RayLogger *RayLogger_init(const char *client_type, - int log_level, - int is_direct, - void *conn) { - RayLogger *logger = (RayLogger *) malloc(sizeof(RayLogger)); - logger->client_type = client_type; - logger->log_level = log_level; - logger->is_direct = is_direct; - logger->conn = conn; - return logger; -} - -void RayLogger_free(RayLogger *logger) { - free(logger); -} - -void RayLogger_log(RayLogger *logger, - int log_level, - const char *event_type, - const char *message) { - if (log_level < logger->log_level) { - return; - } - if (log_level < RAY_LOG_DEBUG || log_level > RAY_LOG_FATAL) { - return; - } - struct timeval tv; - gettimeofday(&tv, NULL); - std::string timestamp = - std::to_string(tv.tv_sec) + "." + std::to_string(tv.tv_usec); - - /* Find number of bytes that would have been written for formatted_message - * size */ - size_t formatted_message_size = - std::snprintf(nullptr, 0, log_fmt, timestamp.c_str(), "%b", - log_levels[log_level], event_type, message, - timestamp.c_str()) + - 1; - /* Fill out everything except the client ID, which is binary data. */ - char formatted_message[formatted_message_size]; - std::snprintf(formatted_message, formatted_message_size, log_fmt, - timestamp.c_str(), "%b", log_levels[log_level], event_type, - message, timestamp.c_str()); - - if (logger->is_direct) { - DBHandle *db = (DBHandle *) logger->conn; - /* Fill in the client ID and send the message to Redis. */ - - redisAsyncContext *context = get_redis_context(db, db->client); - - int status = - redisAsyncCommand(context, NULL, NULL, formatted_message, - (char *) db->client.data(), sizeof(db->client)); - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "error while logging message to log table"); - } - } else { - /* If we don't own a Redis connection, we leave our client - * ID to be filled in by someone else. */ - int *socket_fd = (int *) logger->conn; - write_log_message(*socket_fd, formatted_message); - } -} - -void RayLogger_log_event(DBHandle *db, - uint8_t *key, - int64_t key_length, - uint8_t *value, - int64_t value_length, - double timestamp) { - std::string timestamp_string = std::to_string(timestamp); - int status = redisAsyncCommand(db->context, NULL, NULL, "ZADD %b %s %b", key, - key_length, timestamp_string.c_str(), value, - value_length); - if ((status == REDIS_ERR) || db->context->err) { - LOG_REDIS_DEBUG(db->context, "error while logging message to event log"); - } -} diff --git a/src/common/logging.h b/src/common/logging.h deleted file mode 100644 index 1fa57a60c7123..0000000000000 --- a/src/common/logging.h +++ /dev/null @@ -1,58 +0,0 @@ -#ifndef LOGGING_H -#define LOGGING_H - -#define RAY_LOG_VERBOSE -1 -#define RAY_LOG_DEBUG 0 -#define RAY_LOG_INFO 1 -#define RAY_LOG_WARNING 2 -#define RAY_LOG_ERROR 3 -#define RAY_LOG_FATAL 4 - -/* Entity types. */ -#define RAY_FUNCTION "FUNCTION" -#define RAY_OBJECT "OBJECT" -#define RAY_TASK "TASK" - -#include "state/db.h" - -typedef struct RayLoggerImpl RayLogger; - -/* Initialize a Ray logger for the given client type and logging level. If the - * is_direct flag is set, the logger will treat the given connection as a - * direct connection to the log. Otherwise, it will treat it as a socket to - * another process with a connection to the log. - * NOTE: User is responsible for freeing the returned logger. */ -RayLogger *RayLogger_init(const char *client_type, - int log_level, - int is_direct, - void *conn); - -/* Free the logger. This does not free the connection to the log. 
*/ -void RayLogger_free(RayLogger *logger); - -/* Log an event at the given log level with the given event_type. - * NOTE: message cannot contain spaces! JSON format is recommended. - * TODO: Support spaces in messages. */ -void RayLogger_log(RayLogger *logger, - int log_level, - const char *event_type, - const char *message); - -/** - * Log an event to the event log. - * - * @param db The database handle. - * @param key The key in Redis to store the event in. - * @param key_length The length of the key. - * @param value The value to log. - * @param value_length The length of the value. - * @return Void. - */ -void RayLogger_log_event(DBHandle *db, - uint8_t *key, - int64_t key_length, - uint8_t *value, - int64_t value_length, - double time); - -#endif /* LOGGING_H */ diff --git a/src/common/net.cc b/src/common/net.cc deleted file mode 100644 index 3f2aaf6fa94e5..0000000000000 --- a/src/common/net.cc +++ /dev/null @@ -1,24 +0,0 @@ -#include "net.h" - -#include - -#include - -#include "common.h" - -int parse_ip_addr_port(const char *ip_addr_port, char *ip_addr, int *port) { - char port_str[6]; - int parsed = sscanf(ip_addr_port, "%15[0-9.]:%5[0-9]", ip_addr, port_str); - if (parsed != 2) { - return -1; - } - *port = atoi(port_str); - return 0; -} - -/* Return true if the ip address is valid. */ -bool valid_ip_address(const std::string &ip_address) { - struct sockaddr_in sa; - int result = inet_pton(AF_INET, ip_address.c_str(), &sa.sin_addr); - return result == 1; -} diff --git a/src/common/net.h b/src/common/net.h deleted file mode 100644 index 109cdf3fa1f33..0000000000000 --- a/src/common/net.h +++ /dev/null @@ -1,9 +0,0 @@ -#ifndef NET_H -#define NET_H - -/* Helper function to parse a string of the form : into the - * given ip_addr and port pointers. The ip_addr buffer must already be - * allocated. Return 0 upon success and -1 upon failure. */ -int parse_ip_addr_port(const char *ip_addr_port, char *ip_addr, int *port); - -#endif /* NET_H */ diff --git a/src/common/redis_module/ray_redis_module.cc b/src/common/redis_module/ray_redis_module.cc deleted file mode 100644 index d594f74effef0..0000000000000 --- a/src/common/redis_module/ray_redis_module.cc +++ /dev/null @@ -1,1886 +0,0 @@ -#include - -#include "common_protocol.h" -#include "format/common_generated.h" -#include "ray/gcs/format/gcs_generated.h" -#include "ray/id.h" -#include "redis_string.h" -#include "redismodule.h" -#include "task.h" - -#if RAY_USE_NEW_GCS -// Under this flag, ray-project/credis will be loaded. Specifically, via -// "path/redis-server --loadmodule --loadmodule " (dlopen() under the hood) will a definition of "module" -// be supplied. -// -// All commands in this file that depend on "module" must be wrapped by "#if -// RAY_USE_NEW_GCS", until we switch to this launch configuration as the -// default. -#include "chain_module.h" -extern RedisChainModule module; -#endif - -// Various tables are maintained in redis: -// -// == OBJECT TABLE == -// -// This consists of two parts: -// - The object location table, indexed by OL:object_id, which is the set of -// plasma manager indices that have access to the object. -// (In redis this is represented by a zset (sorted set).) -// -// - The object info table, indexed by OI:object_id, which is a hashmap of: -// "hash" -> the hash of the object, -// "data_size" -> the size of the object in bytes, -// "task" -> the task ID that generated this object. -// "is_put" -> 0 or 1. 
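// (Illustratively, a single object is therefore stored under two keys: an
// OL:<object id> zset holding the plasma manager client IDs that have the
// object, and an OI:<object id> hash holding the "hash", "data_size", "task",
// and "is_put" fields described above.)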
-// -// == TASK TABLE == -// -// It maps each TT:task_id to a hash: -// "state" -> the state of the task, encoded as a bit mask of scheduling_state -// enum values in task.h, -// "local_scheduler_id" -> the ID of the local scheduler the task is assigned -// to, -// "TaskSpec" -> serialized bytes of a TaskInfo (defined in common.fbs), which -// describes the details this task. -// -// See also the definition of TaskReply in common.fbs. - -#define OBJECT_INFO_PREFIX "OI:" -#define OBJECT_LOCATION_PREFIX "OL:" -#define OBJECT_NOTIFICATION_PREFIX "ON:" -#define TASK_PREFIX "TT:" -#define OBJECT_BCAST "BCAST" - -#define OBJECT_CHANNEL_PREFIX "OC:" - -#define CHECK_ERROR(STATUS, MESSAGE) \ - if ((STATUS) == REDISMODULE_ERR) { \ - return RedisModule_ReplyWithError(ctx, (MESSAGE)); \ - } - -/// Parse a Redis string into a TablePubsub channel. -TablePubsub ParseTablePubsub(const RedisModuleString *pubsub_channel_str) { - long long pubsub_channel_long; - RAY_CHECK(RedisModule_StringToLongLong( - pubsub_channel_str, &pubsub_channel_long) == REDISMODULE_OK) - << "Pubsub channel must be a valid TablePubsub"; - auto pubsub_channel = static_cast(pubsub_channel_long); - RAY_CHECK(pubsub_channel >= TablePubsub::MIN && - pubsub_channel <= TablePubsub::MAX) - << "Pubsub channel must be a valid TablePubsub"; - return pubsub_channel; -} - -/// Format a pubsub channel for a specific key. pubsub_channel_str should -/// contain a valid TablePubsub. -RedisModuleString *FormatPubsubChannel( - RedisModuleCtx *ctx, - const RedisModuleString *pubsub_channel_str, - const RedisModuleString *id) { - // Format the pubsub channel enum to a string. TablePubsub_MAX should be more - // than enough digits, but add 1 just in case for the null terminator. - char pubsub_channel[static_cast(TablePubsub::MAX) + 1]; - sprintf(pubsub_channel, "%d", - static_cast(ParseTablePubsub(pubsub_channel_str))); - return RedisString_Format(ctx, "%s:%S", pubsub_channel, id); -} - -// TODO(swang): This helper function should be deprecated by the version below, -// which uses enums for table prefixes. -RedisModuleKey *OpenPrefixedKey(RedisModuleCtx *ctx, - const char *prefix, - RedisModuleString *keyname, - int mode, - RedisModuleString **mutated_key_str) { - RedisModuleString *prefixed_keyname = - RedisString_Format(ctx, "%s%S", prefix, keyname); - // Pass out the key being mutated, should the caller request so. 
- if (mutated_key_str != nullptr) { - *mutated_key_str = prefixed_keyname; - } - RedisModuleKey *key = - (RedisModuleKey *) RedisModule_OpenKey(ctx, prefixed_keyname, mode); - return key; -} - -RedisModuleKey *OpenPrefixedKey(RedisModuleCtx *ctx, - RedisModuleString *prefix_enum, - RedisModuleString *keyname, - int mode, - RedisModuleString **mutated_key_str) { - long long prefix_long; - RAY_CHECK(RedisModule_StringToLongLong(prefix_enum, &prefix_long) == - REDISMODULE_OK) - << "Prefix must be a valid TablePrefix"; - auto prefix = static_cast(prefix_long); - RAY_CHECK(prefix != TablePrefix::UNUSED) - << "This table has no prefix registered"; - RAY_CHECK(prefix >= TablePrefix::MIN && prefix <= TablePrefix::MAX) - << "Prefix must be a valid TablePrefix"; - return OpenPrefixedKey(ctx, EnumNameTablePrefix(prefix), keyname, mode, - mutated_key_str); -} - -RedisModuleKey *OpenPrefixedKey(RedisModuleCtx *ctx, - const char *prefix, - RedisModuleString *keyname, - int mode) { - return OpenPrefixedKey(ctx, prefix, keyname, mode, - /*mutated_key_str=*/nullptr); -} - -RedisModuleKey *OpenPrefixedKey(RedisModuleCtx *ctx, - RedisModuleString *prefix_enum, - RedisModuleString *keyname, - int mode) { - return OpenPrefixedKey(ctx, prefix_enum, keyname, mode, - /*mutated_key_str=*/nullptr); -} - -/// Open the key used to store the channels that should be published to when an -/// update happens at the given keyname. -RedisModuleKey *OpenBroadcastKey(RedisModuleCtx *ctx, - RedisModuleString *pubsub_channel_str, - RedisModuleString *keyname, - int mode) { - RedisModuleString *channel = - FormatPubsubChannel(ctx, pubsub_channel_str, keyname); - RedisModuleString *prefixed_keyname = - RedisString_Format(ctx, "BCAST:%S", channel); - RedisModuleKey *key = - (RedisModuleKey *) RedisModule_OpenKey(ctx, prefixed_keyname, mode); - return key; -} - -/** - * This is a helper method to convert a redis module string to a flatbuffer - * string. - * - * @param fbb The flatbuffer builder. - * @param redis_string The redis string. - * @return The flatbuffer string. - */ -flatbuffers::Offset RedisStringToFlatbuf( - flatbuffers::FlatBufferBuilder &fbb, - RedisModuleString *redis_string) { - size_t redis_string_size; - const char *redis_string_str = - RedisModule_StringPtrLen(redis_string, &redis_string_size); - return fbb.CreateString(redis_string_str, redis_string_size); -} - -/** - * Publish a notification to a client's notification channel about an insertion - * or deletion to the db client table. - * - * TODO(swang): Use flatbuffers for the notification message. - * The format for the published notification is: - * : - * If no manager address is provided, manager_address will be set to ":". If - * is_insertion is true, then the last field will be "1", else "0". - * - * @param ctx The Redis context. - * @param ray_client_id The ID of the database client that was inserted or - * deleted. - * @param client_type The type of client that was inserted or deleted. - * @param manager_address An optional secondary address for the object manager - * associated with this database client. - * @param is_insertion A boolean that's true if the update was an insertion and - * false if deletion. - * @return True if the publish was successful and false otherwise. - */ -bool PublishDBClientNotification(RedisModuleCtx *ctx, - RedisModuleString *ray_client_id, - RedisModuleString *client_type, - RedisModuleString *manager_address, - bool is_insertion) { - /* Construct strings to publish on the db client channel. 
*/ - RedisModuleString *channel_name = - RedisModule_CreateString(ctx, "db_clients", strlen("db_clients")); - /* Construct the flatbuffers object to publish over the channel. */ - flatbuffers::FlatBufferBuilder fbb; - /* Use an empty aux address if one is not passed in. */ - flatbuffers::Offset manager_address_str; - if (manager_address != NULL) { - manager_address_str = RedisStringToFlatbuf(fbb, manager_address); - } else { - manager_address_str = fbb.CreateString("", strlen("")); - } - /* Create the flatbuffers message. */ - auto message = CreateSubscribeToDBClientTableReply( - fbb, RedisStringToFlatbuf(fbb, ray_client_id), - RedisStringToFlatbuf(fbb, client_type), manager_address_str, - is_insertion); - fbb.Finish(message); - /* Create a Redis string to publish by serializing the flatbuffers object. */ - RedisModuleString *client_info = RedisModule_CreateString( - ctx, (const char *) fbb.GetBufferPointer(), fbb.GetSize()); - - /* Publish the client info on the db client channel. */ - RedisModuleCallReply *reply; - reply = RedisModule_Call(ctx, "PUBLISH", "ss", channel_name, client_info); - return (reply != NULL); -} - -/** - * Register a client with Redis. This is called from a client with the command: - * - * RAY.CONNECT - * ... - * - * The command can take an arbitrary number of pairs of field names and keys, - * and these will be stored in a hashmap associated with this client. Several - * fields are singled out for special treatment: - * - * manager_address: This is provided by local schedulers and plasma - * managers and should be the address of the plasma manager that the - * client is associated with. This is published to the "db_clients" - * channel by the RAY.CONNECT command. - * - * @param ray_client_id The db client ID of the client. - * @param node_ip_address The IP address of the node the client is on. - * @param client_type The type of the client (e.g., plasma_manager). - * @return OK if the operation was successful. - */ -int Connect_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc < 4) { - return RedisModule_WrongArity(ctx); - } - if (argc % 2 != 0) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleString *ray_client_id = argv[1]; - RedisModuleString *node_ip_address = argv[2]; - RedisModuleString *client_type = argv[3]; - - /* Add this client to the Ray db client table. */ - RedisModuleKey *db_client_table_key = - OpenPrefixedKey(ctx, DB_CLIENT_PREFIX, ray_client_id, REDISMODULE_WRITE); - - if (RedisModule_KeyType(db_client_table_key) != REDISMODULE_KEYTYPE_EMPTY) { - return RedisModule_ReplyWithError(ctx, "Client already exists"); - } - - /* This will be used to construct a publish message. */ - RedisModuleString *manager_address = NULL; - RedisModuleString *manager_address_key = RedisModule_CreateString( - ctx, "manager_address", strlen("manager_address")); - RedisModuleString *deleted = RedisModule_CreateString(ctx, "0", strlen("0")); - - RedisModule_HashSet(db_client_table_key, REDISMODULE_HASH_CFIELDS, - "ray_client_id", ray_client_id, "node_ip_address", - node_ip_address, "client_type", client_type, "deleted", - deleted, NULL); - - for (int i = 4; i < argc; i += 2) { - RedisModuleString *key = argv[i]; - RedisModuleString *value = argv[i + 1]; - RedisModule_HashSet(db_client_table_key, REDISMODULE_HASH_NONE, key, value, - NULL); - if (RedisModule_StringCompare(key, manager_address_key) == 0) { - manager_address = value; - } - } - /* Clean up. 
*/ - if (!PublishDBClientNotification(ctx, ray_client_id, client_type, - manager_address, true)) { - return RedisModule_ReplyWithError(ctx, "PUBLISH unsuccessful"); - } - - RedisModule_ReplyWithSimpleString(ctx, "OK"); - return REDISMODULE_OK; -} - -/** - * Remove a client from Redis. This is called from a client with the command: - * - * RAY.DISCONNECT - * - * This method also publishes a notification to all subscribers to the - * db_clients channel. The notification consists of a message of the form ":". - * - * @param ray_client_id The db client ID of the client. - * @return OK if the operation was successful. - */ -int Disconnect_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 2) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleString *ray_client_id = argv[1]; - - /* Get the client type. */ - RedisModuleKey *db_client_table_key = - OpenPrefixedKey(ctx, DB_CLIENT_PREFIX, ray_client_id, REDISMODULE_WRITE); - - RedisModuleString *deleted_string; - RedisModule_HashGet(db_client_table_key, REDISMODULE_HASH_CFIELDS, "deleted", - &deleted_string, NULL); - long long deleted; - int parsed = RedisModule_StringToLongLong(deleted_string, &deleted); - if (parsed != REDISMODULE_OK) { - return RedisModule_ReplyWithError(ctx, "Unable to parse deleted field"); - } - - bool published = true; - if (deleted == 0) { - /* Remove the client from the client table. */ - RedisModuleString *deleted = - RedisModule_CreateString(ctx, "1", strlen("1")); - RedisModule_HashSet(db_client_table_key, REDISMODULE_HASH_CFIELDS, - "deleted", deleted, NULL); - - RedisModuleString *client_type; - RedisModuleString *manager_address; - RedisModule_HashGet(db_client_table_key, REDISMODULE_HASH_CFIELDS, - "client_type", &client_type, "manager_address", - &manager_address, NULL); - - /* Publish the deletion notification on the db client channel. */ - published = PublishDBClientNotification(ctx, ray_client_id, client_type, - manager_address, false); - } - - if (!published) { - /* Return an error message if we weren't able to publish the deletion - * notification. */ - return RedisModule_ReplyWithError(ctx, "PUBLISH unsuccessful"); - } - - RedisModule_ReplyWithSimpleString(ctx, "OK"); - return REDISMODULE_OK; -} - -/** - * Lookup an entry in the object table. - * - * This is called from a client with the command: - * - * RAY.OBJECT_TABLE_LOOKUP - * - * @param object_id A string representing the object ID. - * @return A list, possibly empty, of plasma manager IDs that are listed in the - * object table as having the object. If there was no entry found in - * the object table, returns nil. - */ -int ObjectTableLookup_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 2) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleKey *key = - OpenPrefixedKey(ctx, OBJECT_LOCATION_PREFIX, argv[1], REDISMODULE_READ); - - if (RedisModule_KeyType(key) == REDISMODULE_KEYTYPE_EMPTY) { - /* Return nil if no entry was found. */ - return RedisModule_ReplyWithNull(ctx); - } - if (RedisModule_ValueLength(key) == 0) { - /* Return empty list if there are no managers. 
*/ - return RedisModule_ReplyWithArray(ctx, 0); - } - - CHECK_ERROR( - RedisModule_ZsetFirstInScoreRange(key, REDISMODULE_NEGATIVE_INFINITE, - REDISMODULE_POSITIVE_INFINITE, 1, 1), - "Unable to initialize zset iterator"); - - RedisModule_ReplyWithArray(ctx, REDISMODULE_POSTPONED_ARRAY_LEN); - int num_results = 0; - do { - RedisModuleString *curr = RedisModule_ZsetRangeCurrentElement(key, NULL); - RedisModule_ReplyWithString(ctx, curr); - num_results += 1; - } while (RedisModule_ZsetRangeNext(key)); - RedisModule_ReplySetArrayLength(ctx, num_results); - - return REDISMODULE_OK; -} - -/** - * Publish a notification to a client's object notification channel if at least - * one manager is listed as having the object in the object table. - * - * @param ctx The Redis context. - * @param client_id The ID of the client that is being notified. - * @param object_id The object ID of interest. - * @param key The opened key for the entry in the object table corresponding to - * the object ID of interest. - * @return True if the publish was successful and false otherwise. - */ -bool PublishObjectNotification(RedisModuleCtx *ctx, - RedisModuleString *client_id, - RedisModuleString *object_id, - RedisModuleString *data_size, - RedisModuleKey *key) { - flatbuffers::FlatBufferBuilder fbb; - - long long data_size_value; - if (RedisModule_StringToLongLong(data_size, &data_size_value) != - REDISMODULE_OK) { - return RedisModule_ReplyWithError(ctx, "data_size must be integer"); - } - - std::vector> manager_ids; - CHECK_ERROR( - RedisModule_ZsetFirstInScoreRange(key, REDISMODULE_NEGATIVE_INFINITE, - REDISMODULE_POSITIVE_INFINITE, 1, 1), - "Unable to initialize zset iterator"); - /* Loop over the managers in the object table for this object ID. */ - do { - RedisModuleString *curr = RedisModule_ZsetRangeCurrentElement(key, NULL); - manager_ids.push_back(RedisStringToFlatbuf(fbb, curr)); - } while (RedisModule_ZsetRangeNext(key)); - - auto message = CreateSubscribeToNotificationsReply( - fbb, RedisStringToFlatbuf(fbb, object_id), data_size_value, - fbb.CreateVector(manager_ids)); - fbb.Finish(message); - - /* Publish the notification to the clients notification channel. - * TODO(rkn): These notifications could be batched together. */ - RedisModuleString *channel_name = - RedisString_Format(ctx, "%s%S", OBJECT_CHANNEL_PREFIX, client_id); - - RedisModuleString *payload = RedisModule_CreateString( - ctx, (const char *) fbb.GetBufferPointer(), fbb.GetSize()); - - RedisModuleCallReply *reply; - reply = RedisModule_Call(ctx, "PUBLISH", "ss", channel_name, payload); - if (reply == NULL) { - return false; - } - return true; -} - -// NOTE(pcmoritz): This is a temporary redis command that will be removed once -// the GCS uses https://github.com/pcmoritz/credis. -int PublishTaskTableAdd(RedisModuleCtx *ctx, - RedisModuleString *id, - RedisModuleString *data) { - const char *buf = RedisModule_StringPtrLen(data, NULL); - auto message = flatbuffers::GetRoot(buf); - RAY_CHECK(message != nullptr); - - if (message->scheduling_state() == SchedulingState::WAITING || - message->scheduling_state() == SchedulingState::SCHEDULED) { - /* Build the PUBLISH topic and message for task table subscribers. The - * topic - * is a string in the format "TASK_PREFIX::". - * The - * message is a serialized SubscribeToTasksReply flatbuffer object. 
*/ - std::string state = - std::to_string(static_cast(message->scheduling_state())); - RedisModuleString *publish_topic = RedisString_Format( - ctx, "%s%b:%s", TASK_PREFIX, message->scheduler_id()->str().data(), - sizeof(DBClientID), state.c_str()); - - /* Construct the flatbuffers object for the payload. */ - flatbuffers::FlatBufferBuilder fbb; - /* Create the flatbuffers message. */ - auto msg = - CreateTaskReply(fbb, RedisStringToFlatbuf(fbb, id), - static_cast(message->scheduling_state()), - fbb.CreateString(message->scheduler_id()), - fbb.CreateString(message->execution_dependencies()), - fbb.CreateString(message->task_info()), - message->spillback_count(), true /* not used */); - fbb.Finish(msg); - - RedisModuleString *publish_message = RedisModule_CreateString( - ctx, (const char *) fbb.GetBufferPointer(), fbb.GetSize()); - - RedisModuleCallReply *reply = - RedisModule_Call(ctx, "PUBLISH", "ss", publish_topic, publish_message); - - /* See how many clients received this publish. */ - long long num_clients = RedisModule_CallReplyInteger(reply); - RAY_CHECK(num_clients <= 1) << "Published to " << num_clients - << " clients."; - } - return RedisModule_ReplyWithSimpleString(ctx, "OK"); -} - -/// Publish a notification for a new entry at a key. This publishes a -/// notification to all subscribers of the table, as well as every client that -/// has requested notifications for this key. -/// -/// \param pubsub_channel_str The pubsub channel name that notifications for -/// this key should be published to. When publishing to a specific -/// client, the channel name should be :. -/// \param id The ID of the key that the notification is about. -/// \param data The data to publish. -/// \return OK if there is no error during a publish. -int PublishTableAdd(RedisModuleCtx *ctx, - RedisModuleString *pubsub_channel_str, - RedisModuleString *id, - RedisModuleString *data) { - // Serialize the notification to send. - flatbuffers::FlatBufferBuilder fbb; - auto data_flatbuf = RedisStringToFlatbuf(fbb, data); - auto message = CreateGcsTableEntry(fbb, RedisStringToFlatbuf(fbb, id), - fbb.CreateVector(&data_flatbuf, 1)); - fbb.Finish(message); - - // Write the data back to any subscribers that are listening to all table - // notifications. - RedisModuleCallReply *reply = - RedisModule_Call(ctx, "PUBLISH", "sb", pubsub_channel_str, - fbb.GetBufferPointer(), fbb.GetSize()); - if (reply == NULL) { - return RedisModule_ReplyWithError(ctx, "error during PUBLISH"); - } - - // Publish the data to any clients who requested notifications on this key. - RedisModuleKey *notification_key = OpenBroadcastKey( - ctx, pubsub_channel_str, id, REDISMODULE_READ | REDISMODULE_WRITE); - if (RedisModule_KeyType(notification_key) != REDISMODULE_KEYTYPE_EMPTY) { - // NOTE(swang): Sets are not implemented yet, so we use ZSETs instead. 
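// Each member of this broadcast ZSET is a per-client channel name of the form
// <pubsub channel>:<client ID> (see FormatPubsubChannel above); clients are
// added to it by RAY.TABLE_REQUEST_NOTIFICATIONS, and the same serialized
// GcsTableEntry is published to every such channel in the loop below.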
- CHECK_ERROR(RedisModule_ZsetFirstInScoreRange( - notification_key, REDISMODULE_NEGATIVE_INFINITE, - REDISMODULE_POSITIVE_INFINITE, 1, 1), - "Unable to initialize zset iterator"); - for (; !RedisModule_ZsetRangeEndReached(notification_key); - RedisModule_ZsetRangeNext(notification_key)) { - RedisModuleString *client_channel = - RedisModule_ZsetRangeCurrentElement(notification_key, NULL); - RedisModuleCallReply *reply = - RedisModule_Call(ctx, "PUBLISH", "sb", client_channel, - fbb.GetBufferPointer(), fbb.GetSize()); - if (reply == NULL) { - return RedisModule_ReplyWithError(ctx, "error during PUBLISH"); - } - } - } - return RedisModule_ReplyWithSimpleString(ctx, "OK"); -} - -// RAY.TABLE_ADD: -// TableAdd_RedisCommand: the actual command handler. -// (helper) TableAdd_DoWrite: performs the write to redis state. -// (helper) TableAdd_DoPublish: performs a publish after the write. -// ChainTableAdd_RedisCommand: the same command, chain-enabled. - -int TableAdd_DoWrite(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc, - RedisModuleString **mutated_key_str) { - if (argc != 5) { - return RedisModule_WrongArity(ctx); - } - RedisModuleString *prefix_str = argv[1]; - RedisModuleString *id = argv[3]; - RedisModuleString *data = argv[4]; - - RedisModuleKey *key = - OpenPrefixedKey(ctx, prefix_str, id, REDISMODULE_READ | REDISMODULE_WRITE, - mutated_key_str); - RedisModule_StringSet(key, data); - return REDISMODULE_OK; -} - -int TableAdd_DoPublish(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - if (argc != 5) { - return RedisModule_WrongArity(ctx); - } - RedisModuleString *pubsub_channel_str = argv[2]; - RedisModuleString *id = argv[3]; - RedisModuleString *data = argv[4]; - - TablePubsub pubsub_channel = ParseTablePubsub(pubsub_channel_str); - - if (pubsub_channel == TablePubsub::TASK) { - // Publish the task to its subscribers. - // TODO(swang): This is only necessary for legacy Ray and should be removed - // once we switch to using the new GCS API for the task table. - return PublishTaskTableAdd(ctx, id, data); - } else if (pubsub_channel != TablePubsub::NO_PUBLISH) { - // All other pubsub channels write the data back directly onto the channel. - return PublishTableAdd(ctx, pubsub_channel_str, id, data); - } else { - return RedisModule_ReplyWithSimpleString(ctx, "OK"); - } -} - -/// Add an entry at a key. This overwrites any existing data at the key. -/// Publishes a notification about the update to all subscribers, if a pubsub -/// channel is provided. -/// -/// This is called from a client with the command: -/// -/// RAY.TABLE_ADD -/// -/// \param table_prefix The prefix string for keys in this table. -/// \param pubsub_channel The pubsub channel name that notifications for -/// this key should be published to. When publishing to a specific -/// client, the channel name should be :. -/// \param id The ID of the key to set. -/// \param data The data to insert at the key. -/// \return The current value at the key, or OK if there is no value. 
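// --- Illustrative sketch (not part of the original module) ------------------
// Shows how a client might issue the RAY.TABLE_ADD command described above
// over a plain Redis connection using the hiredis API. The numeric prefix and
// channel values, the ID, and the payload are hypothetical placeholders; real
// callers pass valid TablePrefix/TablePubsub enum values and a serialized
// flatbuffer as the data argument.
#include <hiredis/hiredis.h>

void ExampleTableAdd(redisContext *context, const char *id, size_t id_len,
                     const char *data, size_t data_len) {
  // Argument layout expected by TableAdd_RedisCommand below:
  //   RAY.TABLE_ADD <table_prefix> <pubsub_channel> <id> <data>
  redisReply *reply = static_cast<redisReply *>(
      redisCommand(context, "RAY.TABLE_ADD %d %d %b %b",
                   2 /* hypothetical TablePrefix value */,
                   0 /* hypothetical TablePubsub value */, id, id_len, data,
                   data_len));
  if (reply == nullptr) {
    return;  // Connection-level error.
  }
  // On success the module replies with the simple status string "OK".
  freeReplyObject(reply);
}
// -----------------------------------------------------------------------------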
-int TableAdd_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - TableAdd_DoWrite(ctx, argv, argc, /*mutated_key_str=*/nullptr); - return TableAdd_DoPublish(ctx, argv, argc); -} - -#if RAY_USE_NEW_GCS -int ChainTableAdd_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - return module.ChainReplicate(ctx, argv, argc, /*node_func=*/TableAdd_DoWrite, - /*tail_func=*/TableAdd_DoPublish); -} -#endif - -int TableAppend_DoWrite(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc, - RedisModuleString **mutated_key_str) { - if (argc < 5 || argc > 6) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleString *prefix_str = argv[1]; - RedisModuleString *id = argv[3]; - RedisModuleString *data = argv[4]; - RedisModuleString *index_str = nullptr; - if (argc == 6) { - index_str = argv[5]; - } - - // Set the keys in the table. - RedisModuleKey *key = - OpenPrefixedKey(ctx, prefix_str, id, REDISMODULE_READ | REDISMODULE_WRITE, - mutated_key_str); - // Determine the index at which the data should be appended. If no index is - // requested, then is the current length of the log. - size_t index = RedisModule_ValueLength(key); - if (index_str != nullptr) { - // Parse the requested index. - long long requested_index; - RAY_CHECK(RedisModule_StringToLongLong(index_str, &requested_index) == - REDISMODULE_OK); - RAY_CHECK(requested_index >= 0); - index = static_cast(requested_index); - } - // Only perform the append if the requested index matches the current length - // of the log, or if no index was requested. - if (index == RedisModule_ValueLength(key)) { - // The requested index matches the current length of the log or no index - // was requested. Perform the append. - int flags = REDISMODULE_ZADD_NX; - RedisModule_ZsetAdd(key, index, data, &flags); - // Check that we actually add a new entry during the append. This is only - // necessary since we implement the log with a sorted set, so all entries - // must be unique, or else we will have gaps in the log. - // TODO(rkn): We need to get rid of this uniqueness requirement. We can - // easily have multiple log events with the same message. - RAY_CHECK(flags == REDISMODULE_ZADD_ADDED) << "Appended a duplicate entry"; - return REDISMODULE_OK; - } else { - // The requested index did not match the current length of the log. Return - // an error message as a string. - static const char *reply = "ERR entry exists"; - RedisModule_ReplyWithStringBuffer(ctx, reply, strlen(reply)); - return REDISMODULE_ERR; - } -} - -int TableAppend_DoPublish(RedisModuleCtx *ctx, - RedisModuleString **argv, - int /*argc*/) { - RedisModuleString *pubsub_channel_str = argv[2]; - RedisModuleString *id = argv[3]; - RedisModuleString *data = argv[4]; - // Publish a message on the requested pubsub channel if necessary. - TablePubsub pubsub_channel = ParseTablePubsub(pubsub_channel_str); - if (pubsub_channel != TablePubsub::NO_PUBLISH) { - // All other pubsub channels write the data back directly onto the - // channel. - return PublishTableAdd(ctx, pubsub_channel_str, id, data); - } else { - return RedisModule_ReplyWithSimpleString(ctx, "OK"); - } -} - -/// Append an entry to the log stored at a key. Publishes a notification about -/// the update to all subscribers, if a pubsub channel is provided. -/// -/// This is called from a client with the command: -// -/// RAY.TABLE_APPEND -/// -/// -/// \param table_prefix The prefix string for keys in this table. 
-/// \param pubsub_channel The pubsub channel name that notifications for -/// this key should be published to. When publishing to a specific -/// client, the channel name should be :. -/// \param id The ID of the key to append to. -/// \param data The data to append to the key. -/// \param index If this is set, then the data must be appended at this index. -/// If the current log is shorter or longer than the requested index, -/// then the append will fail and an error message will be returned as a -/// string. -/// \return OK if the append succeeds, or an error message string if the append -/// fails. -int TableAppend_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - const int status = TableAppend_DoWrite(ctx, argv, argc, - /*mutated_key_str=*/nullptr); - if (status) { - return status; - } - return TableAppend_DoPublish(ctx, argv, argc); -} - -#if RAY_USE_NEW_GCS -int ChainTableAppend_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - return module.ChainReplicate(ctx, argv, argc, - /*node_func=*/TableAppend_DoWrite, - /*tail_func=*/TableAppend_DoPublish); -} -#endif - -/// A helper function to create and finish a GcsTableEntry, based on the -/// current value or values at the given key. -void TableEntryToFlatbuf(RedisModuleKey *table_key, - RedisModuleString *entry_id, - flatbuffers::FlatBufferBuilder &fbb) { - auto key_type = RedisModule_KeyType(table_key); - switch (key_type) { - case REDISMODULE_KEYTYPE_STRING: { - // Build the flatbuffer from the string data. - size_t data_len = 0; - char *data_buf = - RedisModule_StringDMA(table_key, &data_len, REDISMODULE_READ); - auto data = fbb.CreateString(data_buf, data_len); - auto message = CreateGcsTableEntry(fbb, RedisStringToFlatbuf(fbb, entry_id), - fbb.CreateVector(&data, 1)); - fbb.Finish(message); - } break; - case REDISMODULE_KEYTYPE_ZSET: { - // Build the flatbuffer from the set of log entries. - RAY_CHECK(RedisModule_ZsetFirstInScoreRange( - table_key, REDISMODULE_NEGATIVE_INFINITE, - REDISMODULE_POSITIVE_INFINITE, 1, 1) == REDISMODULE_OK); - std::vector> data; - for (; !RedisModule_ZsetRangeEndReached(table_key); - RedisModule_ZsetRangeNext(table_key)) { - data.push_back(RedisStringToFlatbuf( - fbb, RedisModule_ZsetRangeCurrentElement(table_key, NULL))); - } - auto message = CreateGcsTableEntry(fbb, RedisStringToFlatbuf(fbb, entry_id), - fbb.CreateVector(data)); - fbb.Finish(message); - } break; - case REDISMODULE_KEYTYPE_EMPTY: { - auto message = CreateGcsTableEntry( - fbb, RedisStringToFlatbuf(fbb, entry_id), - fbb.CreateVector( - std::vector>())); - fbb.Finish(message); - } break; - default: - RAY_LOG(FATAL) << "Invalid Redis type during lookup: " << key_type; - } -} - -/// Lookup the current value or values at a key. Returns the current value or -/// values at the key. -/// -/// This is called from a client with the command: -// -/// RAY.TABLE_LOOKUP -/// -/// \param table_prefix The prefix string for keys in this table. -/// \param pubsub_channel The pubsub channel name that notifications for -/// this key should be published to. This field is unused for lookups. -/// \param id The ID of the key to lookup. -/// \return nil if the key is empty, the current value if the key type is a -/// string, or an array of the current values if the key type is a set. 
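// --- Illustrative sketch (not part of the original module) ------------------
// The matching read path: a lookup issued with hiredis. The handler below only
// parses the table prefix and the ID, so the pubsub channel argument is unused
// for lookups but must still be supplied; all concrete values here are
// hypothetical placeholders.
#include <hiredis/hiredis.h>

void ExampleTableLookup(redisContext *context, const char *id, size_t id_len) {
  redisReply *reply = static_cast<redisReply *>(
      redisCommand(context, "RAY.TABLE_LOOKUP %d %d %b",
                   2 /* hypothetical TablePrefix value */,
                   0 /* pubsub channel, unused for lookups */, id, id_len));
  if (reply == nullptr) {
    return;  // Connection-level error.
  }
  if (reply->type == REDIS_REPLY_NIL) {
    // No entry is stored at this key.
  } else if (reply->type == REDIS_REPLY_STRING) {
    // reply->str / reply->len hold a serialized GcsTableEntry whose data
    // vector contains the single string value or every entry of the log.
  }
  freeReplyObject(reply);
}
// -----------------------------------------------------------------------------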
-int TableLookup_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc < 4) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleString *prefix_str = argv[1]; - RedisModuleString *id = argv[3]; - - // Lookup the data at the key. - RedisModuleKey *table_key = - OpenPrefixedKey(ctx, prefix_str, id, REDISMODULE_READ); - if (table_key == nullptr) { - RedisModule_ReplyWithNull(ctx); - } else { - // Serialize the data to a flatbuffer to return to the client. - flatbuffers::FlatBufferBuilder fbb; - TableEntryToFlatbuf(table_key, id, fbb); - RedisModule_ReplyWithStringBuffer( - ctx, reinterpret_cast(fbb.GetBufferPointer()), - fbb.GetSize()); - } - return REDISMODULE_OK; -} - -/// Request notifications for changes to a key. Returns the current value or -/// values at the key. Notifications will be sent to the requesting client for -/// every subsequent TABLE_ADD to the key. -/// -/// This is called from a client with the command: -// -/// RAY.TABLE_REQUEST_NOTIFICATIONS -/// -/// -/// \param table_prefix The prefix string for keys in this table. -/// \param pubsub_channel The pubsub channel name that notifications for -/// this key should be published to. When publishing to a specific -/// client, the channel name should be :. -/// \param id The ID of the key to publish notifications for. -/// \param client_id The ID of the client that is being notified. -/// \return nil if the key is empty, the current value if the key type is a -/// string, or an array of the current values if the key type is a set. -int TableRequestNotifications_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 5) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleString *prefix_str = argv[1]; - RedisModuleString *pubsub_channel_str = argv[2]; - RedisModuleString *id = argv[3]; - RedisModuleString *client_id = argv[4]; - RedisModuleString *client_channel = - FormatPubsubChannel(ctx, pubsub_channel_str, client_id); - - // Add this client to the set of clients that should be notified when there - // are changes to the key. - RedisModuleKey *notification_key = OpenBroadcastKey( - ctx, pubsub_channel_str, id, REDISMODULE_READ | REDISMODULE_WRITE); - CHECK_ERROR(RedisModule_ZsetAdd(notification_key, 0.0, client_channel, NULL), - "ZsetAdd failed."); - - // Lookup the current value at the key. - RedisModuleKey *table_key = - OpenPrefixedKey(ctx, prefix_str, id, REDISMODULE_READ); - // Publish the current value at the key to the client that is requesting - // notifications. An empty notification will be published if the key is - // empty. - flatbuffers::FlatBufferBuilder fbb; - TableEntryToFlatbuf(table_key, id, fbb); - RedisModule_Call(ctx, "PUBLISH", "sb", client_channel, - reinterpret_cast(fbb.GetBufferPointer()), - fbb.GetSize()); - - return RedisModule_ReplyWithNull(ctx); -} - -/// Cancel notifications for changes to a key. The client will no longer -/// receive notifications for this key. This does not check if the client -/// first requested notifications before canceling them. -/// -/// This is called from a client with the command: -// -/// RAY.TABLE_CANCEL_NOTIFICATIONS -/// -/// -/// \param table_prefix The prefix string for keys in this table. -/// \param pubsub_channel The pubsub channel name that notifications for -/// this key should be published to. If publishing to a specific client, -/// then the channel name should be :. 
-/// \param id The ID of the key to publish notifications for. -/// \param client_id The ID of the client to cancel notifications for. -/// \return OK. -int TableCancelNotifications_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc < 5) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleString *pubsub_channel_str = argv[2]; - RedisModuleString *id = argv[3]; - RedisModuleString *client_id = argv[4]; - RedisModuleString *client_channel = - FormatPubsubChannel(ctx, pubsub_channel_str, client_id); - - // Remove this client from the set of clients that should be notified when - // there are changes to the key. - RedisModuleKey *notification_key = OpenBroadcastKey( - ctx, pubsub_channel_str, id, REDISMODULE_READ | REDISMODULE_WRITE); - if (RedisModule_KeyType(notification_key) != REDISMODULE_KEYTYPE_EMPTY) { - RAY_CHECK(RedisModule_ZsetRem(notification_key, client_channel, NULL) == - REDISMODULE_OK); - } - - RedisModule_ReplyWithSimpleString(ctx, "OK"); - return REDISMODULE_OK; -} - -bool is_nil(const std::string &data) { - RAY_CHECK(data.size() == kUniqueIDSize); - const uint8_t *d = reinterpret_cast(data.data()); - for (int i = 0; i < kUniqueIDSize; ++i) { - if (d[i] != 255) { - return false; - } - } - return true; -} - -// This is a temporary redis command that will be removed once -// the GCS uses https://github.com/pcmoritz/credis. -// Be careful, this only supports Task Table payloads. -int TableTestAndUpdate_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 5) { - return RedisModule_WrongArity(ctx); - } - RedisModuleString *prefix_str = argv[1]; - RedisModuleString *id = argv[3]; - RedisModuleString *update_data = argv[4]; - - RedisModuleKey *key = OpenPrefixedKey(ctx, prefix_str, id, - REDISMODULE_READ | REDISMODULE_WRITE); - - size_t value_len = 0; - char *value_buf = RedisModule_StringDMA(key, &value_len, REDISMODULE_READ); - - size_t update_len = 0; - const char *update_buf = RedisModule_StringPtrLen(update_data, &update_len); - - auto data = flatbuffers::GetMutableRoot( - reinterpret_cast(value_buf)); - - auto update = flatbuffers::GetRoot(update_buf); - - bool do_update = static_cast(data->scheduling_state()) & - static_cast(update->test_state_bitmask()); - - if (!is_nil(update->test_scheduler_id()->str())) { - do_update = - do_update && - update->test_scheduler_id()->str() == data->scheduler_id()->str(); - } - - if (do_update) { - RAY_CHECK(data->mutate_scheduling_state(update->update_state())); - } - RAY_CHECK(data->mutate_updated(do_update)); - - int result = RedisModule_ReplyWithStringBuffer(ctx, value_buf, value_len); - - return result; -} - -/** - * Add a new entry to the object table or update an existing one. - * - * This is called from a client with the command: - * - * RAY.OBJECT_TABLE_ADD - * - * @param object_id A string representing the object ID. - * @param data_size An integer which is the object size in bytes. - * @param hash_string A string which is a hash of the object. - * @param manager A string which represents the manager ID of the plasma manager - * that has the object. - * @return OK if the operation was successful. If the same object_id is already - * present with a different hash value, the entry is still added, but - * an error with string "hash mismatch" is returned. 
- */ -int ObjectTableAdd_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 5) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleString *object_id = argv[1]; - RedisModuleString *data_size = argv[2]; - RedisModuleString *new_hash = argv[3]; - RedisModuleString *manager = argv[4]; - - long long data_size_value; - if (RedisModule_StringToLongLong(data_size, &data_size_value) != - REDISMODULE_OK) { - return RedisModule_ReplyWithError(ctx, "data_size must be integer"); - } - - /* Set the fields in the object info table. */ - RedisModuleKey *key; - key = OpenPrefixedKey(ctx, OBJECT_INFO_PREFIX, object_id, - REDISMODULE_READ | REDISMODULE_WRITE); - - /* Check if this object was already registered and if the hashes agree. */ - bool hash_mismatch = false; - if (RedisModule_KeyType(key) != REDISMODULE_KEYTYPE_EMPTY) { - RedisModuleString *existing_hash; - RedisModule_HashGet(key, REDISMODULE_HASH_CFIELDS, "hash", &existing_hash, - NULL); - /* The existing hash may be NULL even if the key is present because a call - * to RAY.RESULT_TABLE_ADD may have already created the key. */ - if (existing_hash != NULL) { - /* Check whether the new hash value matches the old one. If not, we will - * later return the "hash mismatch" error. */ - hash_mismatch = (RedisModule_StringCompare(existing_hash, new_hash) != 0); - } - } - - RedisModule_HashSet(key, REDISMODULE_HASH_CFIELDS, "hash", new_hash, NULL); - RedisModule_HashSet(key, REDISMODULE_HASH_CFIELDS, "data_size", data_size, - NULL); - - /* Add the location in the object location table. */ - RedisModuleKey *table_key; - table_key = OpenPrefixedKey(ctx, OBJECT_LOCATION_PREFIX, object_id, - REDISMODULE_READ | REDISMODULE_WRITE); - - /* Sets are not implemented yet, so we use ZSETs instead. */ - RedisModule_ZsetAdd(table_key, 0.0, manager, NULL); - - RedisModuleString *bcast_client_str = - RedisModule_CreateString(ctx, OBJECT_BCAST, strlen(OBJECT_BCAST)); - bool success = PublishObjectNotification(ctx, bcast_client_str, object_id, - data_size, table_key); - if (!success) { - /* The publish failed somehow. */ - return RedisModule_ReplyWithError(ctx, "PUBLISH BCAST unsuccessful"); - } - - /* Get the zset of clients that requested a notification about the - * availability of this object. */ - RedisModuleKey *object_notification_key = - OpenPrefixedKey(ctx, OBJECT_NOTIFICATION_PREFIX, object_id, - REDISMODULE_READ | REDISMODULE_WRITE); - /* If the zset exists, initialize the key to iterate over the zset. */ - if (RedisModule_KeyType(object_notification_key) != - REDISMODULE_KEYTYPE_EMPTY) { - CHECK_ERROR(RedisModule_ZsetFirstInScoreRange( - object_notification_key, REDISMODULE_NEGATIVE_INFINITE, - REDISMODULE_POSITIVE_INFINITE, 1, 1), - "Unable to initialize zset iterator"); - /* Iterate over the list of clients that requested notifiations about the - * availability of this object, and publish notifications to their object - * notification channels. */ - - do { - RedisModuleString *client_id = - RedisModule_ZsetRangeCurrentElement(object_notification_key, NULL); - /* TODO(rkn): Some computation could be saved by batching the string - * constructions in the multiple calls to PublishObjectNotification - * together. */ - bool success = PublishObjectNotification(ctx, client_id, object_id, - data_size, table_key); - if (!success) { - /* The publish failed somehow. 
*/ - return RedisModule_ReplyWithError(ctx, "PUBLISH unsuccessful"); - } - } while (RedisModule_ZsetRangeNext(object_notification_key)); - /* Now that the clients have been notified, remove the zset of clients - * waiting for notifications. */ - CHECK_ERROR(RedisModule_DeleteKey(object_notification_key), - "Unable to delete zset key."); - } - - if (hash_mismatch) { - return RedisModule_ReplyWithError(ctx, "hash mismatch"); - } else { - RedisModule_ReplyWithSimpleString(ctx, "OK"); - return REDISMODULE_OK; - } -} - -/** - * Remove a manager from a location entry in the object table. - * - * This is called from a client with the command: - * - * RAY.OBJECT_TABLE_REMOVE - * - * @param object_id A string representing the object ID. - * @param manager A string which represents the manager ID of the plasma manager - * to remove. - * @return OK if the operation was successful or an error with string - * "object not found" if the entry for the object_id doesn't exist. The - * operation is counted as a success if the manager was already not in - * the entry. - */ -int ObjectTableRemove_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 3) { - return RedisModule_WrongArity(ctx); - } - - RedisModuleString *object_id = argv[1]; - RedisModuleString *manager = argv[2]; - - /* Remove the location from the object location table. */ - RedisModuleKey *table_key; - table_key = OpenPrefixedKey(ctx, OBJECT_LOCATION_PREFIX, object_id, - REDISMODULE_READ | REDISMODULE_WRITE); - if (RedisModule_KeyType(table_key) == REDISMODULE_KEYTYPE_EMPTY) { - return RedisModule_ReplyWithError(ctx, "object not found"); - } - - RedisModule_ZsetRem(table_key, manager, NULL); - - RedisModule_ReplyWithSimpleString(ctx, "OK"); - return REDISMODULE_OK; -} - -/** - * Request notifications about the presence of some object IDs. This command - * takes a list of object IDs. For each object ID, the reply will be the list - * of plasma managers that contain the object. If the list of plasma managers - * is currently nonempty, then the reply will happen immediately. Else, the - * reply will come later, on the first invocation of `RAY.OBJECT_TABLE_ADD` - * following this call. - * - * This is called from a client with the command: - * - * RAY.OBJECT_TABLE_REQUEST_NOTIFICATIONS - * ... - * - * @param client_id The ID of the client that is requesting the notifications. - * @param object_id(n) The ID of the nth object ID that is passed to this - * command. This command can take any number of object IDs. - * @return OK if the operation was successful. - */ -int ObjectTableRequestNotifications_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc < 3) { - return RedisModule_WrongArity(ctx); - } - - /* The first argument is the client ID. The other arguments are object IDs. */ - RedisModuleString *client_id = argv[1]; - - /* Loop over the object ID arguments to this command. */ - for (int i = 2; i < argc; ++i) { - RedisModuleString *object_id = argv[i]; - RedisModuleKey *key = OpenPrefixedKey(ctx, OBJECT_LOCATION_PREFIX, - object_id, REDISMODULE_READ); - if (RedisModule_KeyType(key) == REDISMODULE_KEYTYPE_EMPTY || - RedisModule_ValueLength(key) == 0) { - /* This object ID is currently not present, so make a note that this - * client should be notified when this object ID becomes available. 
*/ - RedisModuleKey *object_notification_key = - OpenPrefixedKey(ctx, OBJECT_NOTIFICATION_PREFIX, object_id, - REDISMODULE_READ | REDISMODULE_WRITE); - /* Add this client to the list of clients that will be notified when this - * object becomes available. */ - CHECK_ERROR( - RedisModule_ZsetAdd(object_notification_key, 0.0, client_id, NULL), - "ZsetAdd failed."); - } else { - /* Publish a notification to the client's object notification channel. */ - /* Extract the data_size first. */ - RedisModuleKey *object_info_key; - object_info_key = - OpenPrefixedKey(ctx, OBJECT_INFO_PREFIX, object_id, REDISMODULE_READ); - if (RedisModule_KeyType(key) == REDISMODULE_KEYTYPE_EMPTY) { - return RedisModule_ReplyWithError(ctx, "requested object not found"); - } - RedisModuleString *existing_data_size; - RedisModule_HashGet(object_info_key, REDISMODULE_HASH_CFIELDS, - "data_size", &existing_data_size, NULL); - if (existing_data_size == NULL) { - return RedisModule_ReplyWithError(ctx, - "no data_size field in object info"); - } - - bool success = PublishObjectNotification(ctx, client_id, object_id, - existing_data_size, key); - if (!success) { - /* The publish failed somehow. */ - return RedisModule_ReplyWithError(ctx, "PUBLISH unsuccessful"); - } - } - } - - RedisModule_ReplyWithSimpleString(ctx, "OK"); - return REDISMODULE_OK; -} - -int ObjectInfoSubscribe_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - REDISMODULE_NOT_USED(argv); - REDISMODULE_NOT_USED(argc); - return REDISMODULE_OK; -} - -/** - * Add a new entry to the result table or update an existing one. - * - * This is called from a client with the command: - * - * RAY.RESULT_TABLE_ADD - * - * @param object_id A string representing the object ID. - * @param task_id A string representing the task ID of the task that produced - * the object. - * @param is_put An integer that is 1 if the object was created through ray.put - * and 0 if created by return value. - * @return OK if the operation was successful. - */ -int ResultTableAdd_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 4) { - return RedisModule_WrongArity(ctx); - } - - /* Set the task ID under field "task" in the object info table. */ - RedisModuleString *object_id = argv[1]; - RedisModuleString *task_id = argv[2]; - RedisModuleString *is_put = argv[3]; - - /* Check to make sure the is_put field was a 0 or a 1. */ - long long is_put_integer; - if ((RedisModule_StringToLongLong(is_put, &is_put_integer) != - REDISMODULE_OK) || - (is_put_integer != 0 && is_put_integer != 1)) { - return RedisModule_ReplyWithError( - ctx, "The is_put field must be either a 0 or a 1."); - } - - RedisModuleKey *key; - key = OpenPrefixedKey(ctx, OBJECT_INFO_PREFIX, object_id, REDISMODULE_WRITE); - RedisModule_HashSet(key, REDISMODULE_HASH_CFIELDS, "task", task_id, "is_put", - is_put, NULL); - - RedisModule_ReplyWithSimpleString(ctx, "OK"); - - return REDISMODULE_OK; -} - -/** - * Reply with information about a task ID. This is used by - * RAY.RESULT_TABLE_LOOKUP and RAY.TASK_TABLE_GET. - * - * @param ctx The Redis context. - * @param task_id The task ID of the task to reply about. - * @param updated A boolean representing whether the task was updated during - * this operation. This field is only used for - * RAY.TASK_TABLE_TEST_AND_UPDATE operations. - * @return NIL if the task ID is not in the task table. 
An error if the task ID - * is in the task table but the appropriate fields are not there, and - * an array of the task scheduling state, the local scheduler ID, and - * the task spec for the task otherwise. - */ -int ReplyWithTask(RedisModuleCtx *ctx, - RedisModuleString *task_id, - bool updated) { - RedisModuleKey *key = - OpenPrefixedKey(ctx, TASK_PREFIX, task_id, REDISMODULE_READ); - - if (RedisModule_KeyType(key) != REDISMODULE_KEYTYPE_EMPTY) { - /* If the key exists, look up the fields and return them in an array. */ - RedisModuleString *state = NULL; - RedisModuleString *local_scheduler_id = NULL; - RedisModuleString *execution_dependencies = NULL; - RedisModuleString *task_spec = NULL; - RedisModuleString *spillback_count = NULL; - RedisModule_HashGet( - key, REDISMODULE_HASH_CFIELDS, "state", &state, "local_scheduler_id", - &local_scheduler_id, "execution_dependencies", &execution_dependencies, - "TaskSpec", &task_spec, "spillback_count", &spillback_count, NULL); - if (state == NULL || local_scheduler_id == NULL || - execution_dependencies == NULL || task_spec == NULL || - spillback_count == NULL) { - /* We must have either all fields or no fields. */ - return RedisModule_ReplyWithError( - ctx, "Missing fields in the task table entry"); - } - - long long state_integer; - long long spillback_count_val; - if ((RedisModule_StringToLongLong(state, &state_integer) != - REDISMODULE_OK) || - (state_integer < 0) || - (RedisModule_StringToLongLong(spillback_count, &spillback_count_val) != - REDISMODULE_OK) || - (spillback_count_val < 0)) { - return RedisModule_ReplyWithError( - ctx, "Found invalid scheduling state or spillback count."); - } - - flatbuffers::FlatBufferBuilder fbb; - auto message = CreateTaskReply( - fbb, RedisStringToFlatbuf(fbb, task_id), state_integer, - RedisStringToFlatbuf(fbb, local_scheduler_id), - RedisStringToFlatbuf(fbb, execution_dependencies), - RedisStringToFlatbuf(fbb, task_spec), spillback_count_val, updated); - fbb.Finish(message); - - RedisModuleString *reply = RedisModule_CreateString( - ctx, (char *) fbb.GetBufferPointer(), fbb.GetSize()); - RedisModule_ReplyWithString(ctx, reply); - } else { - /* If the key does not exist, return nil. */ - RedisModule_ReplyWithNull(ctx); - } - - return REDISMODULE_OK; -} - -/** - * Lookup an entry in the result table. - * - * This is called from a client with the command: - * - * RAY.RESULT_TABLE_LOOKUP - * - * @param object_id A string representing the object ID. - * @return NIL if the object ID is not in the result table. Otherwise, this - * returns a ResultTableReply flatbuffer. - */ -int ResultTableLookup_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 2) { - return RedisModule_WrongArity(ctx); - } - - /* Get the task ID under field "task" in the object info table. */ - RedisModuleString *object_id = argv[1]; - - RedisModuleKey *key; - key = OpenPrefixedKey(ctx, OBJECT_INFO_PREFIX, object_id, REDISMODULE_READ); - - if (RedisModule_KeyType(key) == REDISMODULE_KEYTYPE_EMPTY) { - return RedisModule_ReplyWithNull(ctx); - } - - RedisModuleString *task_id; - RedisModuleString *is_put; - RedisModuleString *data_size; - RedisModuleString *hash; - RedisModule_HashGet(key, REDISMODULE_HASH_CFIELDS, "task", &task_id, "is_put", - &is_put, "data_size", &data_size, "hash", &hash, NULL); - - if (task_id == NULL || is_put == NULL) { - return RedisModule_ReplyWithNull(ctx); - } - - /* Check to make sure the is_put field was a 0 or a 1. 
*/ - long long is_put_integer; - if (RedisModule_StringToLongLong(is_put, &is_put_integer) != REDISMODULE_OK || - (is_put_integer != 0 && is_put_integer != 1)) { - return RedisModule_ReplyWithError( - ctx, "The is_put field must be either a 0 or a 1."); - } - - /* Make and return the flatbuffer reply. */ - flatbuffers::FlatBufferBuilder fbb; - long long data_size_value; - - if (data_size == NULL) { - data_size_value = -1; - } else { - RedisModule_StringToLongLong(data_size, &data_size_value); - RAY_CHECK(RedisModule_StringToLongLong(data_size, &data_size_value) == - REDISMODULE_OK); - } - - flatbuffers::Offset hash_str; - if (hash == NULL) { - hash_str = fbb.CreateString("", strlen("")); - } else { - hash_str = RedisStringToFlatbuf(fbb, hash); - } - - flatbuffers::Offset message = - CreateResultTableReply(fbb, RedisStringToFlatbuf(fbb, task_id), - bool(is_put_integer), data_size_value, hash_str); - - fbb.Finish(message); - RedisModuleString *reply = RedisModule_CreateString( - ctx, (const char *) fbb.GetBufferPointer(), fbb.GetSize()); - RedisModule_ReplyWithString(ctx, reply); - - return REDISMODULE_OK; -} - -int TaskTableWrite(RedisModuleCtx *ctx, - RedisModuleString *task_id, - RedisModuleString *state, - RedisModuleString *local_scheduler_id, - RedisModuleString *execution_dependencies, - RedisModuleString *spillback_count, - RedisModuleString *task_spec) { - /* Extract the scheduling state. */ - long long state_value; - if (RedisModule_StringToLongLong(state, &state_value) != REDISMODULE_OK) { - return RedisModule_ReplyWithError(ctx, "scheduling state must be integer"); - } - - long long spillback_count_value; - if (RedisModule_StringToLongLong(spillback_count, &spillback_count_value) != - REDISMODULE_OK) { - return RedisModule_ReplyWithError(ctx, "spillback count must be integer"); - } - /* Add the task to the task table. If no spec was provided, get the existing - * spec out of the task table so we can publish it. */ - RedisModuleString *existing_task_spec = NULL; - RedisModuleKey *key = - OpenPrefixedKey(ctx, TASK_PREFIX, task_id, REDISMODULE_WRITE); - if (task_spec == NULL) { - RedisModule_HashSet(key, REDISMODULE_HASH_CFIELDS, "state", state, - "local_scheduler_id", local_scheduler_id, - "execution_dependencies", execution_dependencies, - "spillback_count", spillback_count, NULL); - RedisModule_HashGet(key, REDISMODULE_HASH_CFIELDS, "TaskSpec", - &existing_task_spec, NULL); - if (existing_task_spec == NULL) { - return RedisModule_ReplyWithError( - ctx, "Cannot update a task that doesn't exist yet"); - } - } else { - RedisModule_HashSet( - key, REDISMODULE_HASH_CFIELDS, "state", state, "local_scheduler_id", - local_scheduler_id, "execution_dependencies", execution_dependencies, - "TaskSpec", task_spec, "spillback_count", spillback_count, NULL); - } - - if (static_cast(state_value) == TaskStatus::WAITING || - static_cast(state_value) == TaskStatus::SCHEDULED) { - /* Build the PUBLISH topic and message for task table subscribers. The - * topic is a string in the format - * "TASK_PREFIX::". The message is a serialized - * SubscribeToTasksReply flatbuffer object. */ - RedisModuleString *publish_topic = RedisString_Format( - ctx, "%s%S:%S", TASK_PREFIX, local_scheduler_id, state); - - /* Construct the flatbuffers object for the payload. */ - flatbuffers::FlatBufferBuilder fbb; - /* Use the old task spec if the current one is NULL. 
*/ - RedisModuleString *task_spec_to_use; - if (task_spec != NULL) { - task_spec_to_use = task_spec; - } else { - task_spec_to_use = existing_task_spec; - } - /* Create the flatbuffers message. */ - auto message = CreateTaskReply( - fbb, RedisStringToFlatbuf(fbb, task_id), state_value, - RedisStringToFlatbuf(fbb, local_scheduler_id), - RedisStringToFlatbuf(fbb, execution_dependencies), - RedisStringToFlatbuf(fbb, task_spec_to_use), spillback_count_value, - true); // The updated field is not used. - fbb.Finish(message); - - RedisModuleString *publish_message = RedisModule_CreateString( - ctx, (const char *) fbb.GetBufferPointer(), fbb.GetSize()); - - RedisModuleCallReply *reply = - RedisModule_Call(ctx, "PUBLISH", "ss", publish_topic, publish_message); - - /* See how many clients received this publish. */ - long long num_clients = RedisModule_CallReplyInteger(reply); - RAY_CHECK(num_clients <= 1) << "Published to " << num_clients - << " clients."; - - if (reply == NULL) { - return RedisModule_ReplyWithError(ctx, "PUBLISH unsuccessful"); - } - - if (num_clients == 0) { - /* This reply will be received by redis_task_table_update_callback or - * redis_task_table_add_task_callback in redis.cc, which will then reissue - * the command. */ - return RedisModule_ReplyWithError(ctx, - "No subscribers received message."); - } - } - - RedisModule_ReplyWithSimpleString(ctx, "OK"); - - return REDISMODULE_OK; -} - -/** - * Add a new entry to the task table. This will overwrite any existing entry - * with the same task ID. - * - * This is called from a client with the command: - * - * RAY.TASK_TABLE_ADD - * - * - * @param task_id A string that is the ID of the task. - * @param state A string that is the current scheduling state (a - * scheduling_state enum instance). - * @param local_scheduler_id A string that is the ray client ID of the - * associated local scheduler, if any. - * @param execution_dependencies A string that is the list of execution - * dependencies. - * @param task_spec A string that is the specification of the task, which can - * be cast to a `task_spec`. - * @return OK if the operation was successful. - */ -int TaskTableAddTask_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 7) { - return RedisModule_WrongArity(ctx); - } - - return TaskTableWrite(ctx, argv[1], argv[2], argv[3], argv[4], argv[5], - argv[6]); -} - -/** - * Update an entry in the task table. This does not update the task - * specification in the table. - * - * This is called from a client with the command: - * - * RAY.TASK_TABLE_UPDATE - * - * - * @param task_id A string that is the ID of the task. - * @param state A string that is the current scheduling state (a - * scheduling_state enum instance). - * @param ray_client_id A string that is the ray client ID of the associated - * local scheduler, if any. - * @param execution_dependencies A string that is the list of execution - * dependencies. - * @return OK if the operation was successful. - */ -int TaskTableUpdate_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 6) { - return RedisModule_WrongArity(ctx); - } - - return TaskTableWrite(ctx, argv[1], argv[2], argv[3], argv[4], argv[5], NULL); -} - -/** - * Test and update an entry in the task table if the current value matches the - * test value bitmask. This does not update the task specification in the - * table. 
- * - * This is called from a client with the command: - * - * RAY.TASK_TABLE_TEST_AND_UPDATE - * - * - * @param task_id A string that is the ID of the task. - * @param test_state_bitmask A string that is the test bitmask for the - * scheduling state. The update happens if and only if the current - * scheduling state AND-ed with the bitmask is greater than 0. - * @param state A string that is the scheduling state (a scheduling_state enum - * instance) to update the task entry with. - * @param ray_client_id A string that is the ray client ID of the associated - * local scheduler, if any, to update the task entry with. - * @param test_local_scheduler_id A string to test the local scheduler ID. If - * provided, and if the current local scheduler ID does not match it, - * then the update does not happen. - * @return Returns the task entry as a TaskReply. The reply will reflect the - * update, if it happened. - */ -int TaskTableTestAndUpdate_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc < 5 || argc > 6) { - return RedisModule_WrongArity(ctx); - } - /* If a sixth argument was provided, then we should also test the current - * local scheduler ID. */ - bool test_local_scheduler = (argc == 6); - - RedisModuleString *task_id = argv[1]; - RedisModuleString *test_state = argv[2]; - RedisModuleString *update_state = argv[3]; - RedisModuleString *local_scheduler_id = argv[4]; - - RedisModuleKey *key = OpenPrefixedKey(ctx, TASK_PREFIX, task_id, - REDISMODULE_READ | REDISMODULE_WRITE); - if (RedisModule_KeyType(key) == REDISMODULE_KEYTYPE_EMPTY) { - return RedisModule_ReplyWithNull(ctx); - } - - /* If the key exists, look up the fields and return them in an array. */ - RedisModuleString *current_state = NULL; - RedisModuleString *current_local_scheduler_id = NULL; - RedisModule_HashGet(key, REDISMODULE_HASH_CFIELDS, "state", ¤t_state, - "local_scheduler_id", ¤t_local_scheduler_id, NULL); - - long long current_state_integer; - if (RedisModule_StringToLongLong(current_state, ¤t_state_integer) != - REDISMODULE_OK) { - return RedisModule_ReplyWithError(ctx, "current_state must be integer"); - } - - if (current_state_integer < 0) { - return RedisModule_ReplyWithError(ctx, "Found invalid scheduling state."); - } - long long test_state_bitmask; - int status = RedisModule_StringToLongLong(test_state, &test_state_bitmask); - if (status != REDISMODULE_OK) { - return RedisModule_ReplyWithError( - ctx, "Invalid test value for scheduling state"); - } - - bool update = false; - if (current_state_integer & test_state_bitmask) { - if (test_local_scheduler) { - /* A test local scheduler ID was provided. Test whether it is equal to - * the current local scheduler ID before performing the update. */ - RedisModuleString *test_local_scheduler_id = argv[5]; - if (RedisModule_StringCompare(current_local_scheduler_id, - test_local_scheduler_id) == 0) { - /* If the current local scheduler ID does matches the test ID, then - * perform the update. */ - update = true; - } - } else { - /* No test local scheduler ID was provided. Perform the update. */ - update = true; - } - } - - /* If the scheduling state and local scheduler ID tests passed, then perform - * the update. */ - if (update) { - RedisModule_HashSet(key, REDISMODULE_HASH_CFIELDS, "state", update_state, - "local_scheduler_id", local_scheduler_id, NULL); - } - - /* Construct a reply by getting the task from the task ID. 
*/ - return ReplyWithTask(ctx, task_id, update); -} - -/** - * Get an entry from the task table. - * - * This is called from a client with the command: - * - * RAY.TASK_TABLE_GET - * - * @param task_id A string of the task ID to look up. - * @return An array of strings representing the task fields in the following - * order: 1) (integer) scheduling state 2) (string) associated local - * scheduler ID, if any 3) (string) the task specification, which can be - * cast to a task_spec. If the task ID is not in the table, returns nil. - */ -int TaskTableGet_RedisCommand(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - RedisModule_AutoMemory(ctx); - - if (argc != 2) { - return RedisModule_WrongArity(ctx); - } - - /* Construct a reply by getting the task from the task ID. */ - return ReplyWithTask(ctx, argv[1], false); -} - -extern "C" { - -/* This function must be present on each Redis module. It is used in order to - * register the commands into the Redis server. */ -int RedisModule_OnLoad(RedisModuleCtx *ctx, - RedisModuleString **argv, - int argc) { - REDISMODULE_NOT_USED(argv); - REDISMODULE_NOT_USED(argc); - - if (RedisModule_Init(ctx, "ray", 1, REDISMODULE_APIVER_1) == - REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.connect", Connect_RedisCommand, - "write pubsub", 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.disconnect", Disconnect_RedisCommand, - "write pubsub", 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.table_add", TableAdd_RedisCommand, - "write pubsub", 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.table_append", - TableAppend_RedisCommand, "write", 0, 0, - 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.table_lookup", - TableLookup_RedisCommand, "readonly", 0, 0, - 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.table_request_notifications", - TableRequestNotifications_RedisCommand, - "write pubsub", 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.table_cancel_notifications", - TableCancelNotifications_RedisCommand, - "write pubsub", 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.table_test_and_update", - TableTestAndUpdate_RedisCommand, "write", 0, 0, - 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.object_table_lookup", - ObjectTableLookup_RedisCommand, "readonly", 0, - 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.object_table_add", - ObjectTableAdd_RedisCommand, "write pubsub", 0, - 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.object_table_remove", - ObjectTableRemove_RedisCommand, "write", 0, 0, - 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.object_table_request_notifications", - ObjectTableRequestNotifications_RedisCommand, - "write pubsub", 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.object_info_subscribe", - ObjectInfoSubscribe_RedisCommand, "pubsub", 0, - 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, 
"ray.result_table_add", - ResultTableAdd_RedisCommand, "write", 0, 0, - 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.result_table_lookup", - ResultTableLookup_RedisCommand, "readonly", 0, - 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.task_table_add", - TaskTableAddTask_RedisCommand, "write pubsub", - 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.task_table_update", - TaskTableUpdate_RedisCommand, "write pubsub", 0, - 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.task_table_test_and_update", - TaskTableTestAndUpdate_RedisCommand, - "write pubsub", 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - - if (RedisModule_CreateCommand(ctx, "ray.task_table_get", - TaskTableGet_RedisCommand, "readonly", 0, 0, - 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - -#if RAY_USE_NEW_GCS - // Chain-enabled commands that depend on ray-project/credis. - if (RedisModule_CreateCommand(ctx, "ray.chain.table_add", - ChainTableAdd_RedisCommand, "write pubsub", 0, - 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } - if (RedisModule_CreateCommand(ctx, "ray.chain.table_append", - ChainTableAppend_RedisCommand, "write pubsub", - 0, 0, 0) == REDISMODULE_ERR) { - return REDISMODULE_ERR; - } -#endif - - return REDISMODULE_OK; -} - -} /* extern "C" */ diff --git a/src/common/shims/windows/getopt.c b/src/common/shims/windows/getopt.c deleted file mode 100644 index d9c4ae583307f..0000000000000 --- a/src/common/shims/windows/getopt.c +++ /dev/null @@ -1,69 +0,0 @@ -/* http://stackoverflow.com/a/17195644/541686 */ - -#include -#include - -int opterr = 1, /* if error message should be printed */ - optind = 1, /* index into parent argv vector */ - optopt, /* character checked for validity */ - optreset; /* reset getopt */ -char *optarg; /* argument associated with option */ - -#define BADCH (int) '?' -#define BADARG (int) ':' -#define EMSG "" - -/* -* getopt -- -* Parse argc/argv argument vector. -*/ -int getopt(int nargc, char *const nargv[], const char *ostr) { - static char *place = EMSG; /* option letter processing */ - const char *oli; /* option letter list index */ - - if (optreset || !*place) { /* update scanning pointer */ - optreset = 0; - if (optind >= nargc || *(place = nargv[optind]) != '-') { - place = EMSG; - return (-1); - } - if (place[1] && *++place == '-') { /* found "--" */ - ++optind; - place = EMSG; - return (-1); - } - } /* option letter okay? */ - if ((optopt = (int) *place++) == (int) ':' || !(oli = strchr(ostr, optopt))) { - /* - * if the user didn't specify '-' as an option, - * assume it means -1. 
- */ - if (optopt == (int) '-') - return (-1); - if (!*place) - ++optind; - if (opterr && *ostr != ':') - (void) printf("illegal option -- %c\n", optopt); - return (BADCH); - } - if (*++oli != ':') { /* don't need argument */ - optarg = NULL; - if (!*place) - ++optind; - } else { /* need an argument */ - if (*place) /* no white space */ - optarg = place; - else if (nargc <= ++optind) { /* no arg */ - place = EMSG; - if (*ostr == ':') - return (BADARG); - if (opterr) - (void) printf("option requires an argument -- %c\n", optopt); - return (BADCH); - } else /* white space */ - optarg = nargv[optind]; - place = EMSG; - ++optind; - } - return (optopt); /* dump back option letter */ -} diff --git a/src/common/shims/windows/getopt.h b/src/common/shims/windows/getopt.h deleted file mode 100644 index 1870fb87f7930..0000000000000 --- a/src/common/shims/windows/getopt.h +++ /dev/null @@ -1,4 +0,0 @@ -#ifndef GETOPT_H -#define GETOPT_H - -#endif /* GETOPT_H */ diff --git a/src/common/shims/windows/msg.c b/src/common/shims/windows/msg.c deleted file mode 100644 index 5142c1aadf2ed..0000000000000 --- a/src/common/shims/windows/msg.c +++ /dev/null @@ -1,208 +0,0 @@ -#include - -int socketpair(int domain, int type, int protocol, int sv[2]) { - if ((domain != AF_UNIX && domain != AF_INET) || type != SOCK_STREAM) { - return INVALID_SOCKET; - } - SOCKET sockets[2]; - int r = dumb_socketpair(sockets); - sv[0] = (int) sockets[0]; - sv[1] = (int) sockets[1]; - return r; -} - -#pragma comment(lib, "IPHlpAPI.lib") - -struct _MIB_TCPROW2 { - DWORD dwState, dwLocalAddr, dwLocalPort, dwRemoteAddr, dwRemotePort, - dwOwningPid; - enum _TCP_CONNECTION_OFFLOAD_STATE dwOffloadState; -}; - -struct _MIB_TCPTABLE2 { - DWORD dwNumEntries; - struct _MIB_TCPROW2 table[1]; -}; - -DECLSPEC_IMPORT ULONG WINAPI GetTcpTable2(struct _MIB_TCPTABLE2 *TcpTable, - PULONG SizePointer, - BOOL Order); - -static DWORD getsockpid(SOCKET client) { - /* http://stackoverflow.com/a/25431340 */ - DWORD pid = 0; - - struct sockaddr_in Server = {0}; - int ServerSize = sizeof(Server); - - struct sockaddr_in Client = {0}; - int ClientSize = sizeof(Client); - - if ((getsockname(client, (struct sockaddr *) &Server, &ServerSize) == 0) && - (getpeername(client, (struct sockaddr *) &Client, &ClientSize) == 0)) { - struct _MIB_TCPTABLE2 *TcpTable = NULL; - ULONG TcpTableSize = 0; - ULONG result; - do { - result = GetTcpTable2(TcpTable, &TcpTableSize, TRUE); - if (result != ERROR_INSUFFICIENT_BUFFER) { - break; - } - free(TcpTable); - TcpTable = (struct _MIB_TCPTABLE2 *) malloc(TcpTableSize); - } while (TcpTable != NULL); - - if (result == NO_ERROR) { - for (DWORD dw = 0; dw < TcpTable->dwNumEntries; ++dw) { - struct _MIB_TCPROW2 *row = &(TcpTable->table[dw]); - if ((row->dwState == 5 /* MIB_TCP_STATE_ESTAB */) && - (row->dwLocalAddr == Client.sin_addr.s_addr) && - ((row->dwLocalPort & 0xFFFF) == Client.sin_port) && - (row->dwRemoteAddr == Server.sin_addr.s_addr) && - ((row->dwRemotePort & 0xFFFF) == Server.sin_port)) { - pid = row->dwOwningPid; - break; - } - } - } - - free(TcpTable); - } - - return pid; -} - -ssize_t sendmsg(int sockfd, struct msghdr *msg, int flags) { - ssize_t result = -1; - struct cmsghdr *header = CMSG_FIRSTHDR(msg); - if (header->cmsg_level == SOL_SOCKET && header->cmsg_type == SCM_RIGHTS) { - /* We're trying to send over a handle of some kind. - * We have to look up which process we're communicating with, - * open a handle to it, and then duplicate our handle into it. - * However, the first two steps cannot be done atomically. 
- * Therefore, this code HAS A RACE CONDITIONS and is therefore NOT SECURE. - * In the absense of a malicious actor, though, it is exceedingly unlikely - * that the child process closes AND that its process ID is reassigned - * to another existing process. - */ - struct msghdr const old_msg = *msg; - int *const pfd = (int *) CMSG_DATA(header); - msg->msg_control = NULL; - msg->msg_controllen = 0; - WSAPROTOCOL_INFO protocol_info = {0}; - BOOL const is_socket = !!FDAPI_GetSocketStatePtr(*pfd); - DWORD const target_pid = getsockpid(sockfd); - HANDLE target_process = NULL; - if (target_pid) { - if (!is_socket) { - /* This is a regular handle... fit it into the same struct */ - target_process = OpenProcess(PROCESS_DUP_HANDLE, FALSE, target_pid); - if (target_process) { - if (DuplicateHandle(GetCurrentProcess(), (HANDLE)(intptr_t) *pfd, - target_process, (HANDLE *) &protocol_info, 0, - TRUE, DUPLICATE_SAME_ACCESS)) { - result = 0; - } - } - } else { - /* This is a socket... */ - result = FDAPI_WSADuplicateSocket(*pfd, target_pid, &protocol_info); - } - } - if (result == 0) { - int const nbufs = msg->dwBufferCount + 1; - WSABUF *const bufs = - (struct _WSABUF *) _alloca(sizeof(*msg->lpBuffers) * nbufs); - bufs[0].buf = (char *) &protocol_info; - bufs[0].len = sizeof(protocol_info); - memcpy(&bufs[1], msg->lpBuffers, - msg->dwBufferCount * sizeof(*msg->lpBuffers)); - DWORD nb; - msg->lpBuffers = bufs; - msg->dwBufferCount = nbufs; - GUID const wsaid_WSASendMsg = { - 0xa441e712, - 0x754f, - 0x43ca, - {0x84, 0xa7, 0x0d, 0xee, 0x44, 0xcf, 0x60, 0x6d}}; - typedef INT PASCAL WSASendMsg_t( - SOCKET s, LPWSAMSG lpMsg, DWORD dwFlags, LPDWORD lpNumberOfBytesSent, - LPWSAOVERLAPPED lpOverlapped, - LPWSAOVERLAPPED_COMPLETION_ROUTINE lpCompletionRoutine); - WSASendMsg_t *WSASendMsg = NULL; - result = FDAPI_WSAIoctl(sockfd, SIO_GET_EXTENSION_FUNCTION_POINTER, - &wsaid_WSASendMsg, sizeof(wsaid_WSASendMsg), - &WSASendMsg, sizeof(WSASendMsg), &nb, NULL, 0); - if (result == 0) { - result = (*WSASendMsg)(sockfd, msg, flags, &nb, NULL, NULL) == 0 - ? (ssize_t)(nb - sizeof(protocol_info)) - : 0; - } - } - if (result != 0 && target_process && !is_socket) { - /* we failed to send the handle, and it needs cleaning up! */ - HANDLE duplicated_back = NULL; - if (DuplicateHandle(target_process, *(HANDLE *) &protocol_info, - GetCurrentProcess(), &duplicated_back, 0, FALSE, - DUPLICATE_CLOSE_SOURCE)) { - CloseHandle(duplicated_back); - } - } - if (target_process) { - CloseHandle(target_process); - } - *msg = old_msg; - } - return result; -} - -ssize_t recvmsg(int sockfd, struct msghdr *msg, int flags) { - int result = -1; - struct cmsghdr *header = CMSG_FIRSTHDR(msg); - if (msg->msg_controllen && - flags == 0 /* We can't send flags on Windows... 
*/) { - struct msghdr const old_msg = *msg; - msg->msg_control = NULL; - msg->msg_controllen = 0; - WSAPROTOCOL_INFO protocol_info = {0}; - int const nbufs = msg->dwBufferCount + 1; - WSABUF *const bufs = - (struct _WSABUF *) _alloca(sizeof(*msg->lpBuffers) * nbufs); - bufs[0].buf = (char *) &protocol_info; - bufs[0].len = sizeof(protocol_info); - memcpy(&bufs[1], msg->lpBuffers, - msg->dwBufferCount * sizeof(*msg->lpBuffers)); - typedef INT PASCAL WSARecvMsg_t( - SOCKET s, LPWSAMSG lpMsg, LPDWORD lpNumberOfBytesRecvd, - LPWSAOVERLAPPED lpOverlapped, - LPWSAOVERLAPPED_COMPLETION_ROUTINE lpCompletionRoutine); - WSARecvMsg_t *WSARecvMsg = NULL; - DWORD nb; - GUID const wsaid_WSARecvMsg = { - 0xf689d7c8, - 0x6f1f, - 0x436b, - {0x8a, 0x53, 0xe5, 0x4f, 0xe3, 0x51, 0xc3, 0x22}}; - result = FDAPI_WSAIoctl(sockfd, SIO_GET_EXTENSION_FUNCTION_POINTER, - &wsaid_WSARecvMsg, sizeof(wsaid_WSARecvMsg), - &WSARecvMsg, sizeof(WSARecvMsg), &nb, NULL, 0); - if (result == 0) { - result = (*WSARecvMsg)(sockfd, msg, &nb, NULL, NULL) == 0 - ? (ssize_t)(nb - sizeof(protocol_info)) - : 0; - } - if (result == 0) { - int *const pfd = (int *) CMSG_DATA(header); - if (protocol_info.iSocketType == 0 && protocol_info.iProtocol == 0) { - *pfd = *(int *) &protocol_info; - } else { - *pfd = FDAPI_WSASocket(FROM_PROTOCOL_INFO, FROM_PROTOCOL_INFO, - FROM_PROTOCOL_INFO, &protocol_info, 0, 0); - } - header->cmsg_level = SOL_SOCKET; - header->cmsg_type = SCM_RIGHTS; - } - *msg = old_msg; - } - return result; -} diff --git a/src/common/shims/windows/netdb.h b/src/common/shims/windows/netdb.h deleted file mode 100644 index 5dace165919a2..0000000000000 --- a/src/common/shims/windows/netdb.h +++ /dev/null @@ -1,4 +0,0 @@ -#ifndef NETDB_H -#define NETDB_H - -#endif /* NETDB_H */ diff --git a/src/common/shims/windows/netinet/in.h b/src/common/shims/windows/netinet/in.h deleted file mode 100644 index a60db3e05dd62..0000000000000 --- a/src/common/shims/windows/netinet/in.h +++ /dev/null @@ -1,4 +0,0 @@ -#ifndef IN_H -#define IN_H - -#endif /* IN_H */ diff --git a/src/common/shims/windows/poll.h b/src/common/shims/windows/poll.h deleted file mode 100644 index 058e23adee645..0000000000000 --- a/src/common/shims/windows/poll.h +++ /dev/null @@ -1,4 +0,0 @@ -#ifndef POLL_H -#define POLL_H - -#endif /* POLL_H */ diff --git a/src/common/shims/windows/socketpair.c b/src/common/shims/windows/socketpair.c deleted file mode 100644 index e9fc792c15a70..0000000000000 --- a/src/common/shims/windows/socketpair.c +++ /dev/null @@ -1,150 +0,0 @@ -/* socketpair.c -Copyright 2007, 2010 by Nathan C. Myers -Redistribution and use in source and binary forms, with or without modification, -are permitted provided that the following conditions are met: - - Redistributions of source code must retain the above copyright notice, this - list of conditions and the following disclaimer. - - Redistributions in binary form must reproduce the above copyright notice, - this list of conditions and the following disclaimer in the documentation - and/or other materials provided with the distribution. - - The name of the author must not be used to endorse or promote products - derived from this software without specific prior written permission. - -THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" -AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE -IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE -DISCLAIMED. 
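/* Illustrative sketch, not from the original sources: the sendmsg()/recvmsg()
 * shims deleted above emulate POSIX descriptor passing on Windows by
 * duplicating handles into the peer process. For comparison, the Unix
 * mechanism they stand in for sends the descriptor as SCM_RIGHTS ancillary
 * data over a connected AF_UNIX stream socket, roughly like this: */
#include <string.h>
#include <sys/socket.h>
#include <sys/uio.h>

/* Send one file descriptor over a connected AF_UNIX stream socket. */
static int send_fd(int sock, int fd_to_send) {
  char payload = 'x'; /* At least one byte of ordinary data must accompany
                       * the ancillary data. */
  struct iovec iov;
  iov.iov_base = &payload;
  iov.iov_len = 1;

  char control[CMSG_SPACE(sizeof(int))];
  memset(control, 0, sizeof(control));

  struct msghdr msg;
  memset(&msg, 0, sizeof(msg));
  msg.msg_iov = &iov;
  msg.msg_iovlen = 1;
  msg.msg_control = control;
  msg.msg_controllen = sizeof(control);

  struct cmsghdr *cmsg = CMSG_FIRSTHDR(&msg);
  cmsg->cmsg_level = SOL_SOCKET;
  cmsg->cmsg_type = SCM_RIGHTS;
  cmsg->cmsg_len = CMSG_LEN(sizeof(int));
  memcpy(CMSG_DATA(cmsg), &fd_to_send, sizeof(int));

  return sendmsg(sock, &msg, 0) == 1 ? 0 : -1;
}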
IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE -FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL -DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR -SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER -CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, -OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE -OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. - */ - -/* Changes: - * 2014-02-12: merge David Woodhouse, Ger Hobbelt improvements - * git.infradead.org/users/dwmw2/openconnect.git/commitdiff/bdeefa54 - * github.com/GerHobbelt/selectable-socketpair - * always init the socks[] to -1/INVALID_SOCKET on error, both on Win32/64 - * and UNIX/other platforms - * 2013-07-18: Change to BSD 3-clause license - * 2010-03-31: - * set addr to 127.0.0.1 because win32 getsockname does not always set it. - * 2010-02-25: - * set SO_REUSEADDR option to avoid leaking some windows resource. - * Windows System Error 10049, "Event ID 4226 TCP/IP has reached - * the security limit imposed on the number of concurrent TCP connect - * attempts." Bleah. - * 2007-04-25: - * preserve value of WSAGetLastError() on all error returns. - * 2007-04-22: (Thanks to Matthew Gregan ) - * s/EINVAL/WSAEINVAL/ fix trivial compile failure - * s/socket/WSASocket/ enable creation of sockets suitable as stdin/stdout - * of a child process. - * add argument make_overlapped - */ - -#include - -#ifdef WIN32 -#include /* socklen_t, et al (MSVC20xx) */ -#include -#include -#else -#ifdef _WIN32 -#include -#include -#endif -#include -#include -#include -#endif - -#ifdef WIN32 - -/* dumb_socketpair: - * If make_overlapped is nonzero, both sockets created will be usable for - * "overlapped" operations via WSASend etc. If make_overlapped is zero, - * socks[0] (only) will be usable with regular ReadFile etc., and thus - * suitable for use as stdin or stdout of a child process. Note that the - * sockets must be closed with closesocket() regardless. - */ - -int dumb_socketpair(SOCKET socks[2]) { - union { - struct sockaddr_in inaddr; - struct sockaddr addr; - } a; - SOCKET listener; - int e; - socklen_t addrlen = sizeof(a.inaddr); - int reuse = 1; - - if (socks == 0) { - return SOCKET_ERROR; - } - socks[0] = socks[1] = -1; - - listener = socket(AF_INET, SOCK_STREAM, IPPROTO_TCP); - if (listener == -1) - return SOCKET_ERROR; - - memset(&a, 0, sizeof(a)); - a.inaddr.sin_family = AF_INET; - a.inaddr.sin_addr.s_addr = htonl(INADDR_LOOPBACK); - a.inaddr.sin_port = 0; - - for (;;) { - if (setsockopt(listener, SOL_SOCKET, SO_REUSEADDR, (char *) &reuse, - (socklen_t) sizeof(reuse)) == -1) - break; - if (bind(listener, &a.addr, sizeof(a.inaddr)) == SOCKET_ERROR) - break; - - memset(&a, 0, sizeof(a)); - if (getsockname(listener, &a.addr, &addrlen) == SOCKET_ERROR) - break; - // win32 getsockname may only set the port number, p=0.0005. 
- // ( http://msdn.microsoft.com/library/ms738543.aspx ): - a.inaddr.sin_addr.s_addr = htonl(INADDR_LOOPBACK); - a.inaddr.sin_family = AF_INET; - - if (listen(listener, 1) == SOCKET_ERROR) - break; - - socks[0] = FDAPI_WSASocket(AF_INET, SOCK_STREAM, 0, NULL, 0, 0); - if (socks[0] == -1) - break; - if (connect(socks[0], &a.addr, sizeof(a.inaddr)) == SOCKET_ERROR) - break; - - socks[1] = accept(listener, NULL, NULL); - if (socks[1] == -1) - break; - - FDAPI_close(listener); - return 0; - } - - FDAPI_close(listener); - FDAPI_close(socks[0]); - FDAPI_close(socks[1]); - socks[0] = socks[1] = -1; - return SOCKET_ERROR; -} -#else -int dumb_socketpair(int socks[2], int dummy) { - if (socks == 0) { - errno = EINVAL; - return -1; - } - dummy = socketpair(AF_LOCAL, SOCK_STREAM, 0, socks); - if (dummy) - socks[0] = socks[1] = -1; - return dummy; -} -#endif diff --git a/src/common/shims/windows/strings.h b/src/common/shims/windows/strings.h deleted file mode 100644 index e264061c4e6ef..0000000000000 --- a/src/common/shims/windows/strings.h +++ /dev/null @@ -1,4 +0,0 @@ -#ifndef STRINGS_H -#define STRINGS_H - -#endif /* STRINGS_H */ diff --git a/src/common/shims/windows/sys/ioctl.h b/src/common/shims/windows/sys/ioctl.h deleted file mode 100644 index 00f7a55ed77dc..0000000000000 --- a/src/common/shims/windows/sys/ioctl.h +++ /dev/null @@ -1,4 +0,0 @@ -#ifndef IOCTL_H -#define IOCTL_H - -#endif /* IOCTL_H */ diff --git a/src/common/shims/windows/sys/mman.h b/src/common/shims/windows/sys/mman.h deleted file mode 100644 index a12df75fc7eac..0000000000000 --- a/src/common/shims/windows/sys/mman.h +++ /dev/null @@ -1,36 +0,0 @@ -#ifndef MMAN_H -#define MMAN_H - -#include - -#define MAP_SHARED 0x0010 /* share changes */ -#define MAP_FAILED ((void *) -1) -#define PROT_READ 0x04 /* pages can be read */ -#define PROT_WRITE 0x02 /* pages can be written */ -#define PROT_EXEC 0x01 /* pages can be executed */ - -static void *mmap(void *addr, - size_t len, - int prot, - int flags, - int fd, - off_t off) { - void *result = (void *) (-1); - if (!addr && prot == MAP_SHARED) { - /* HACK: we're assuming handle sizes can't exceed 32 bits, which is wrong... - * but works for now. */ - void *ptr = MapViewOfFile((HANDLE)(intptr_t) fd, FILE_MAP_ALL_ACCESS, - (DWORD)(off >> (CHAR_BIT * sizeof(DWORD))), - (DWORD) off, (SIZE_T) len); - if (ptr) { - result = ptr; - } - } - return result; -} -static int munmap(void *addr, size_t length) { - (void) length; - return UnmapViewOfFile(addr) ? 
0 : -1; -} - -#endif /* MMAN_H */ diff --git a/src/common/shims/windows/sys/select.h b/src/common/shims/windows/sys/select.h deleted file mode 100644 index 8aef7950e3993..0000000000000 --- a/src/common/shims/windows/sys/select.h +++ /dev/null @@ -1,4 +0,0 @@ -#ifndef SELECT_H -#define SELECT_H - -#endif /* SELECT_H */ diff --git a/src/common/shims/windows/sys/socket.h b/src/common/shims/windows/sys/socket.h deleted file mode 100644 index ba9d656bb96d9..0000000000000 --- a/src/common/shims/windows/sys/socket.h +++ /dev/null @@ -1,36 +0,0 @@ -#ifndef SOCKET_H -#define SOCKET_H - -typedef unsigned short sa_family_t; - -#include "../../src/Win32_Interop/Win32_FDAPI.h" -#include "../../src/Win32_Interop/Win32_APIs.h" - -#define cmsghdr _WSACMSGHDR -#undef CMSG_DATA -#define CMSG_DATA WSA_CMSG_DATA -#define CMSG_SPACE WSA_CMSG_SPACE -#define CMSG_FIRSTHDR WSA_CMSG_FIRSTHDR -#define CMSG_LEN WSA_CMSG_LEN -#define CMSG_NXTHDR WSA_CMSG_NXTHDR - -#define SCM_RIGHTS 1 - -#define iovec _WSABUF -#define iov_base buf -#define iov_len len -#define msghdr _WSAMSG -#define msg_name name -#define msg_namelen namelen -#define msg_iov lpBuffers -#define msg_iovlen dwBufferCount -#define msg_control Control.buf -#define msg_controllen Control.len -#define msg_flags dwFlags - -int dumb_socketpair(SOCKET socks[2]); -ssize_t sendmsg(int sockfd, struct msghdr *msg, int flags); -ssize_t recvmsg(int sockfd, struct msghdr *msg, int flags); -int socketpair(int domain, int type, int protocol, int sv[2]); - -#endif /* SOCKET_H */ diff --git a/src/common/shims/windows/sys/time.h b/src/common/shims/windows/sys/time.h deleted file mode 100644 index 976342bd21215..0000000000000 --- a/src/common/shims/windows/sys/time.h +++ /dev/null @@ -1,12 +0,0 @@ -#ifndef TIME_H -#define TIME_H - -#include /* timeval */ - -int gettimeofday_highres(struct timeval *tv, struct timezone *tz); - -static int gettimeofday(struct timeval *tv, struct timezone *tz) { - return gettimeofday_highres(tv, tz); -} - -#endif /* TIME_H */ diff --git a/src/common/shims/windows/sys/un.h b/src/common/shims/windows/sys/un.h deleted file mode 100644 index 91642683f72eb..0000000000000 --- a/src/common/shims/windows/sys/un.h +++ /dev/null @@ -1,13 +0,0 @@ -#ifndef UN_H -#define UN_H - -#include - -struct sockaddr_un { - /** AF_UNIX. */ - sa_family_t sun_family; - /** The pathname. */ - char sun_path[108]; -}; - -#endif /* UN_H */ diff --git a/src/common/shims/windows/sys/wait.h b/src/common/shims/windows/sys/wait.h deleted file mode 100644 index 442218408f976..0000000000000 --- a/src/common/shims/windows/sys/wait.h +++ /dev/null @@ -1,4 +0,0 @@ -#ifndef WAIT_H -#define WAIT_H - -#endif /* WAIT_H */ diff --git a/src/common/shims/windows/unistd.h b/src/common/shims/windows/unistd.h deleted file mode 100644 index aab25417e199b..0000000000000 --- a/src/common/shims/windows/unistd.h +++ /dev/null @@ -1,11 +0,0 @@ -#ifndef UNISTD_H -#define UNISTD_H - -extern char *optarg; -extern int optind, opterr, optopt; -int getopt(int nargc, char *const nargv[], const char *ostr); - -#include "../../src/Win32_Interop/Win32_FDAPI.h" -#define close(...) 
FDAPI_close(__VA_ARGS__) - -#endif /* UNISTD_H */ diff --git a/src/common/state/actor_notification_table.cc b/src/common/state/actor_notification_table.cc deleted file mode 100644 index 19cd7fddda41e..0000000000000 --- a/src/common/state/actor_notification_table.cc +++ /dev/null @@ -1,47 +0,0 @@ -#include "actor_notification_table.h" - -#include "common_protocol.h" -#include "redis.h" - -void publish_actor_creation_notification(DBHandle *db_handle, - const ActorID &actor_id, - const WorkerID &driver_id, - const DBClientID &local_scheduler_id) { - // Create a flatbuffer object to serialize and publish. - flatbuffers::FlatBufferBuilder fbb; - // Create the flatbuffers message. - auto message = CreateActorCreationNotification( - fbb, to_flatbuf(fbb, actor_id), to_flatbuf(fbb, driver_id), - to_flatbuf(fbb, local_scheduler_id)); - fbb.Finish(message); - - ActorCreationNotificationData *data = - (ActorCreationNotificationData *) malloc( - sizeof(ActorCreationNotificationData) + fbb.GetSize()); - data->size = fbb.GetSize(); - memcpy(&data->flatbuffer_data[0], fbb.GetBufferPointer(), fbb.GetSize()); - - init_table_callback(db_handle, UniqueID::nil(), __func__, - new CommonCallbackData(data), NULL, NULL, - redis_publish_actor_creation_notification, NULL); -} - -void actor_notification_table_subscribe( - DBHandle *db_handle, - actor_notification_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry) { - ActorNotificationTableSubscribeData *sub_data = - (ActorNotificationTableSubscribeData *) malloc( - sizeof(ActorNotificationTableSubscribeData)); - sub_data->subscribe_callback = subscribe_callback; - sub_data->subscribe_context = subscribe_context; - - init_table_callback(db_handle, UniqueID::nil(), __func__, - new CommonCallbackData(sub_data), retry, NULL, - redis_actor_notification_table_subscribe, NULL); -} - -void actor_table_mark_removed(DBHandle *db_handle, ActorID actor_id) { - redis_actor_table_mark_removed(db_handle, actor_id); -} diff --git a/src/common/state/actor_notification_table.h b/src/common/state/actor_notification_table.h deleted file mode 100644 index f6aa101cd0d01..0000000000000 --- a/src/common/state/actor_notification_table.h +++ /dev/null @@ -1,74 +0,0 @@ -#ifndef ACTOR_NOTIFICATION_TABLE_H -#define ACTOR_NOTIFICATION_TABLE_H - -#include "task.h" -#include "db.h" -#include "table.h" - -/* - * ==== Subscribing to the actor notification table ==== - */ - -/* Callback for subscribing to the local scheduler table. */ -typedef void (*actor_notification_table_subscribe_callback)( - const ActorID &actor_id, - const WorkerID &driver_id, - const DBClientID &local_scheduler_id, - void *user_context); - -/// Publish an actor creation notification. This is published by a local -/// scheduler once it creates an actor. -/// -/// \param db_handle Database handle. -/// \param actor_id The ID of the actor that was created. -/// \param driver_id The ID of the driver that created the actor. -/// \param local_scheduler_id The ID of the local scheduler that created the -/// actor. -/// \return Void. -void publish_actor_creation_notification(DBHandle *db_handle, - const ActorID &actor_id, - const WorkerID &driver_id, - const DBClientID &local_scheduler_id); - -/// Data that is needed to publish an actor creation notification. -typedef struct { - /// The size of the flatbuffer object. - int64_t size; - /// The information to be sent. 
- uint8_t flatbuffer_data[0]; -} ActorCreationNotificationData; - -/** - * Register a callback to process actor notification events. - * - * @param db_handle Database handle. - * @param subscribe_callback Callback that will be called when the local - * scheduler event happens. - * @param subscribe_context Context that will be passed into the - * subscribe_callback. - * @param retry Information about retrying the request to the database. - * @return Void. - */ -void actor_notification_table_subscribe( - DBHandle *db_handle, - actor_notification_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry); - -/* Data that is needed to register local scheduler table subscribe callbacks - * with the state database. */ -typedef struct { - actor_notification_table_subscribe_callback subscribe_callback; - void *subscribe_context; -} ActorNotificationTableSubscribeData; - -/** - * Marks an actor as removed. This prevents the actor from being resurrected. - * - * @param db The database handle. - * @param actor_id The actor id to mark as removed. - * @return Void. - */ -void actor_table_mark_removed(DBHandle *db_handle, ActorID actor_id); - -#endif /* ACTOR_NOTIFICATION_TABLE_H */ diff --git a/src/common/state/db.h b/src/common/state/db.h deleted file mode 100644 index ac9960b89374b..0000000000000 --- a/src/common/state/db.h +++ /dev/null @@ -1,70 +0,0 @@ -#ifndef DB_H -#define DB_H - -#include - -#include "common.h" -#include "event_loop.h" - -typedef struct DBHandle DBHandle; - -/** - * Connect to the global system store. - * - * @param db_address The hostname to use to connect to the database. - * @param db_port The port to use to connect to the database. - * @param db_shards_addresses The list of database shard IP addresses. - * @param db_shards_ports The list of database shard ports, in the same order - * as db_shards_addresses. - * @param client_type The type of this client. - * @param node_ip_address The hostname of the client that is connecting. - * @param args A vector of extra arguments strings. They should alternate - * between the name of the argument and the value of the argument. For - * examples: "port", "1234", "socket_name", "/tmp/s1". This vector should - * have an even length. - * @return This returns a handle to the database, which must be freed with - * db_disconnect after use. - */ -DBHandle *db_connect(const std::string &db_primary_address, - int db_primary_port, - const char *client_type, - const char *node_ip_address, - const std::vector &args); - -/** - * Attach global system store connection to an event loop. Callbacks from - * queries to the global system store will trigger events in the event loop. - * - * @param db The handle to the database that is connected. - * @param loop The event loop the database gets connected to. - * @param reattach Can only be true in unit tests. If true, the database is - * reattached to the loop. - * @return Void. - */ -void db_attach(DBHandle *db, event_loop *loop, bool reattach); - -/** - * Disconnect from the global system store. - * - * @param db The database connection to close and clean up. - * @return Void. - */ -void db_disconnect(DBHandle *db); - -/** - * Free the database handle. - * - * @param db The database connection to clean up. - * @return Void. - */ -void DBHandle_free(DBHandle *db); - -/** - * Returns the db client ID. - * - * @param db The handle to the database. - * @returns int The db client ID for this connection to the database. 
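/* Illustrative sketch, not from the original sources, and only meaningful
 * against the legacy db.h being deleted here: the handle declared above was
 * used in a connect / attach / disconnect sequence by the old C components.
 * The client type string and the name/value argument pairs are placeholders
 * taken from the doc comment above, not a required configuration. */
#include <string>
#include <vector>

void legacy_db_lifecycle_example(event_loop *loop) {
  std::vector<std::string> args = {"port", "1234", "socket_name", "/tmp/s1"};
  DBHandle *db =
      db_connect("127.0.0.1", 6379, "test_client", "127.0.0.1", args);
  /* Route callbacks from database queries through the component's event loop. */
  db_attach(db, loop, false);
  /* ... run the event loop and issue table operations here ... */
  db_disconnect(db);
}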
- */ -DBClientID get_db_client_id(DBHandle *db); - -#endif diff --git a/src/common/state/db_client_table.cc b/src/common/state/db_client_table.cc deleted file mode 100644 index b31e9d8c2d3a6..0000000000000 --- a/src/common/state/db_client_table.cc +++ /dev/null @@ -1,90 +0,0 @@ -#include "db_client_table.h" -#include "redis.h" - -void db_client_table_remove(DBHandle *db_handle, - DBClientID db_client_id, - RetryInfo *retry, - db_client_table_done_callback done_callback, - void *user_context) { - init_table_callback(db_handle, db_client_id, __func__, - new CommonCallbackData(NULL), retry, - (table_done_callback) done_callback, - redis_db_client_table_remove, user_context); -} - -void db_client_table_subscribe( - DBHandle *db_handle, - db_client_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry, - db_client_table_done_callback done_callback, - void *user_context) { - DBClientTableSubscribeData *sub_data = - (DBClientTableSubscribeData *) malloc(sizeof(DBClientTableSubscribeData)); - sub_data->subscribe_callback = subscribe_callback; - sub_data->subscribe_context = subscribe_context; - - init_table_callback(db_handle, UniqueID::nil(), __func__, - new CommonCallbackData(sub_data), retry, - (table_done_callback) done_callback, - redis_db_client_table_subscribe, user_context); -} - -const std::vector db_client_table_get_ip_addresses( - DBHandle *db_handle, - const std::vector &manager_ids) { - /* We time this function because in the past this loop has taken multiple - * seconds under stressful situations on hundreds of machines causing the - * plasma manager to die (because it went too long without sending - * heartbeats). */ - int64_t start_time = current_time_ms(); - - /* Construct the manager vector from the flatbuffers object. 
*/ - std::vector manager_vector; - - for (auto const &manager_id : manager_ids) { - DBClient client = redis_cache_get_db_client(db_handle, manager_id); - RAY_CHECK(!client.manager_address.empty()); - if (client.is_alive) { - manager_vector.push_back(client.manager_address); - } - } - - int64_t end_time = current_time_ms(); - if (end_time - start_time > RayConfig::instance().max_time_for_loop()) { - RAY_LOG(WARNING) << "calling redis_get_cached_db_client in a loop in with " - << manager_ids.size() << " manager IDs took " - << end_time - start_time << " milliseconds."; - } - - return manager_vector; -} - -void db_client_table_update_cache_callback(DBClient *db_client, - void *user_context) { - DBHandle *db_handle = (DBHandle *) user_context; - redis_cache_set_db_client(db_handle, *db_client); -} - -void db_client_table_cache_init(DBHandle *db_handle) { - db_client_table_subscribe(db_handle, db_client_table_update_cache_callback, - db_handle, NULL, NULL, NULL); -} - -DBClient db_client_table_cache_get(DBHandle *db_handle, DBClientID client_id) { - RAY_CHECK(!client_id.is_nil()); - return redis_cache_get_db_client(db_handle, client_id); -} - -void plasma_manager_send_heartbeat(DBHandle *db_handle) { - RetryInfo heartbeat_retry; - heartbeat_retry.num_retries = 0; - heartbeat_retry.timeout = - RayConfig::instance().heartbeat_timeout_milliseconds(); - heartbeat_retry.fail_callback = NULL; - - init_table_callback(db_handle, UniqueID::nil(), __func__, - new CommonCallbackData(NULL), - (RetryInfo *) &heartbeat_retry, NULL, - redis_plasma_manager_send_heartbeat, NULL); -} diff --git a/src/common/state/db_client_table.h b/src/common/state/db_client_table.h deleted file mode 100644 index d140ba770eee2..0000000000000 --- a/src/common/state/db_client_table.h +++ /dev/null @@ -1,120 +0,0 @@ -#ifndef DB_CLIENT_TABLE_H -#define DB_CLIENT_TABLE_H - -#include - -#include "db.h" -#include "table.h" - -typedef void (*db_client_table_done_callback)(DBClientID db_client_id, - void *user_context); - -/** - * Remove a client from the db clients table. - * - * @param db_handle Database handle. - * @param db_client_id The database client ID to remove. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Data that will be passed to done_callback and - * fail_callback. - * @return Void. - * - */ -void db_client_table_remove(DBHandle *db_handle, - DBClientID db_client_id, - RetryInfo *retry, - db_client_table_done_callback done_callback, - void *user_context); - -/* - * ==== Subscribing to the db client table ==== - */ - -/* An entry in the db client table. */ -typedef struct { - /** The database client ID. */ - DBClientID id; - /** The database client type. */ - std::string client_type; - /** An optional auxiliary address for the plasma manager associated with this - * database client. */ - std::string manager_address; - /** Whether or not the database client exists. If this is false for an entry, - * then it will never again be true. */ - bool is_alive; -} DBClient; - -/* Callback for subscribing to the db client table. */ -typedef void (*db_client_table_subscribe_callback)(DBClient *db_client, - void *user_context); - -/** - * Register a callback for a db client table event. - * - * @param db_handle Database handle. - * @param subscribe_callback Callback that will be called when the db client - * table is updated. 
- * @param subscribe_context Context that will be passed into the - * subscribe_callback. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Data that will be passed to done_callback and - * fail_callback. - * @return Void. - */ -void db_client_table_subscribe( - DBHandle *db_handle, - db_client_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry, - db_client_table_done_callback done_callback, - void *user_context); - -/* Data that is needed to register db client table subscribe callbacks with the - * state database. */ -typedef struct { - db_client_table_subscribe_callback subscribe_callback; - void *subscribe_context; -} DBClientTableSubscribeData; - -const std::vector db_client_table_get_ip_addresses( - DBHandle *db, - const std::vector &manager_ids); - -/** - * Initialize the db client cache. The cache is updated with each notification - * from the db client table. - * - * @param db_handle Database handle. - * @return Void. - */ -void db_client_table_cache_init(DBHandle *db_handle); - -/** - * Get a db client from the cache. If the requested client is not there, - * request the latest entry from the db client table. - * - * @param db_handle Database handle. - * @param client_id The ID of the client to look up in the cache. - * @return The database client in the cache. - */ -DBClient db_client_table_cache_get(DBHandle *db_handle, DBClientID client_id); - -/* - * ==== Plasma manager heartbeats ==== - */ - -/** - * Start sending heartbeats to the plasma_managers channel. Each - * heartbeat contains this database client's ID. Heartbeats can be subscribed - * to through the plasma_managers channel. Once called, this "retries" the - * heartbeat operation forever, every heartbeat_timeout_milliseconds - * milliseconds. - * - * @param db_handle Database handle. - * @return Void. - */ -void plasma_manager_send_heartbeat(DBHandle *db_handle); - -#endif /* DB_CLIENT_TABLE_H */ diff --git a/src/common/state/driver_table.cc b/src/common/state/driver_table.cc deleted file mode 100644 index b8732e9863b20..0000000000000 --- a/src/common/state/driver_table.cc +++ /dev/null @@ -1,23 +0,0 @@ -#include "driver_table.h" -#include "redis.h" - -void driver_table_subscribe(DBHandle *db_handle, - driver_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry) { - DriverTableSubscribeData *sub_data = - (DriverTableSubscribeData *) malloc(sizeof(DriverTableSubscribeData)); - sub_data->subscribe_callback = subscribe_callback; - sub_data->subscribe_context = subscribe_context; - init_table_callback(db_handle, UniqueID::nil(), __func__, - new CommonCallbackData(sub_data), retry, NULL, - redis_driver_table_subscribe, NULL); -} - -void driver_table_send_driver_death(DBHandle *db_handle, - WorkerID driver_id, - RetryInfo *retry) { - init_table_callback(db_handle, driver_id, __func__, - new CommonCallbackData(NULL), retry, NULL, - redis_driver_table_send_driver_death, NULL); -} diff --git a/src/common/state/driver_table.h b/src/common/state/driver_table.h deleted file mode 100644 index c8c6a6c32382c..0000000000000 --- a/src/common/state/driver_table.h +++ /dev/null @@ -1,50 +0,0 @@ -#ifndef DRIVER_TABLE_H -#define DRIVER_TABLE_H - -#include "db.h" -#include "table.h" -#include "task.h" - -/* - * ==== Subscribing to the driver table ==== - */ - -/* Callback for subscribing to the driver table. 
*/ -typedef void (*driver_table_subscribe_callback)(WorkerID driver_id, - void *user_context); - -/** - * Register a callback for a driver table event. - * - * @param db_handle Database handle. - * @param subscribe_callback Callback that will be called when the driver event - * happens. - * @param subscribe_context Context that will be passed into the - * subscribe_callback. - * @param retry Information about retrying the request to the database. - * @return Void. - */ -void driver_table_subscribe(DBHandle *db_handle, - driver_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry); - -/* Data that is needed to register driver table subscribe callbacks with the - * state database. */ -typedef struct { - driver_table_subscribe_callback subscribe_callback; - void *subscribe_context; -} DriverTableSubscribeData; - -/** - * Send driver death update to all subscribers. - * - * @param db_handle Database handle. - * @param driver_id The ID of the driver that died. - * @param retry Information about retrying the request to the database. - */ -void driver_table_send_driver_death(DBHandle *db_handle, - WorkerID driver_id, - RetryInfo *retry); - -#endif /* DRIVER_TABLE_H */ diff --git a/src/common/state/error_table.cc b/src/common/state/error_table.cc deleted file mode 100644 index d0fd9bdff5e9d..0000000000000 --- a/src/common/state/error_table.cc +++ /dev/null @@ -1,24 +0,0 @@ -#include "error_table.h" -#include "redis.h" - -const char *error_types[] = {"object_hash_mismatch", "put_reconstruction", - "worker_died", "actor_not_created"}; - -void push_error(DBHandle *db_handle, - DBClientID driver_id, - ErrorIndex error_type, - const std::string &error_message) { - int64_t message_size = error_message.size(); - - /* Allocate a struct to hold the error information. */ - ErrorInfo *info = (ErrorInfo *) malloc(sizeof(ErrorInfo) + message_size); - info->driver_id = driver_id; - info->error_type = error_type; - info->error_key = UniqueID::from_random(); - info->size = message_size; - memcpy(info->error_message, error_message.data(), message_size); - - init_table_callback(db_handle, UniqueID::nil(), __func__, - new CommonCallbackData(info), NULL, NULL, - redis_push_error, NULL); -} diff --git a/src/common/state/error_table.h b/src/common/state/error_table.h deleted file mode 100644 index 908d7f4d0eaad..0000000000000 --- a/src/common/state/error_table.h +++ /dev/null @@ -1,50 +0,0 @@ -#ifndef ERROR_TABLE_H -#define ERROR_TABLE_H - -#include "db.h" -#include "table.h" - -/// An ErrorIndex may be used as an index into error_types. -enum class ErrorIndex : int32_t { - /// An object was added with a different hash from the existing one. - OBJECT_HASH_MISMATCH = 0, - /// An object that was created through a ray.put is lost. - PUT_RECONSTRUCTION, - /// A worker died or was killed while executing a task. - WORKER_DIED, - /// An actor hasn't been created for a while. - ACTOR_NOT_CREATED, - /// The total number of error types. - MAX -}; - -/// Data that is needed to push an error. -typedef struct { - /// The ID of the driver to push the error to. - DBClientID driver_id; - /// An index into the error_types array indicating the type of the error. - ErrorIndex error_type; - /// The key to use for the error message in Redis. - UniqueID error_key; - /// The length of the error message. - int64_t size; - /// The error message. - uint8_t error_message[0]; -} ErrorInfo; - -extern const char *error_types[]; - -/// Push an error to the given Python driver. 
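/* Illustrative sketch, not from the original sources; it depends on the
 * error_table.h removed in this change. Reporting a worker failure to a
 * driver through the legacy error table used the push_error() call declared
 * below, for example: */
void report_worker_death_example(DBHandle *db, DBClientID driver_id) {
  /* ErrorIndex::WORKER_DIED indexes the matching entry of the error_types
   * array defined in error_table.cc above. */
  push_error(db, driver_id, ErrorIndex::WORKER_DIED,
             "A worker died or was killed while executing a task.");
}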
-/// -/// \param db_handle Database handle. -/// \param driver_id The ID of the Python driver to push the error to. -/// \param error_type An index specifying the type of the error. This should -/// be a value from the ErrorIndex enum. -/// \param error_message The error message to print. -/// \return Void. -void push_error(DBHandle *db_handle, - DBClientID driver_id, - ErrorIndex error_type, - const std::string &error_message); - -#endif diff --git a/src/common/state/local_scheduler_table.cc b/src/common/state/local_scheduler_table.cc deleted file mode 100644 index 075d52102807c..0000000000000 --- a/src/common/state/local_scheduler_table.cc +++ /dev/null @@ -1,48 +0,0 @@ -#include "local_scheduler_table.h" - -#include "common_protocol.h" -#include "redis.h" - -void local_scheduler_table_subscribe( - DBHandle *db_handle, - local_scheduler_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry) { - LocalSchedulerTableSubscribeData *sub_data = - (LocalSchedulerTableSubscribeData *) malloc( - sizeof(LocalSchedulerTableSubscribeData)); - sub_data->subscribe_callback = subscribe_callback; - sub_data->subscribe_context = subscribe_context; - - init_table_callback(db_handle, UniqueID::nil(), __func__, - new CommonCallbackData(sub_data), retry, NULL, - redis_local_scheduler_table_subscribe, NULL); -} - -void local_scheduler_table_send_info(DBHandle *db_handle, - LocalSchedulerInfo *info, - RetryInfo *retry) { - /* Create a flatbuffer object to serialize and publish. */ - flatbuffers::FlatBufferBuilder fbb; - /* Create the flatbuffers message. */ - auto message = CreateLocalSchedulerInfoMessage( - fbb, to_flatbuf(fbb, db_handle->client), info->total_num_workers, - info->task_queue_length, info->available_workers, - map_to_flatbuf(fbb, info->static_resources), - map_to_flatbuf(fbb, info->dynamic_resources), false); - fbb.Finish(message); - - LocalSchedulerTableSendInfoData *data = - (LocalSchedulerTableSendInfoData *) malloc( - sizeof(LocalSchedulerTableSendInfoData) + fbb.GetSize()); - data->size = fbb.GetSize(); - memcpy(&data->flatbuffer_data[0], fbb.GetBufferPointer(), fbb.GetSize()); - - init_table_callback(db_handle, UniqueID::nil(), __func__, - new CommonCallbackData(data), retry, NULL, - redis_local_scheduler_table_send_info, NULL); -} - -void local_scheduler_table_disconnect(DBHandle *db_handle) { - redis_local_scheduler_table_disconnect(db_handle); -} diff --git a/src/common/state/local_scheduler_table.h b/src/common/state/local_scheduler_table.h deleted file mode 100644 index 239b84d0fa48e..0000000000000 --- a/src/common/state/local_scheduler_table.h +++ /dev/null @@ -1,98 +0,0 @@ -#ifndef LOCAL_SCHEDULER_TABLE_H -#define LOCAL_SCHEDULER_TABLE_H - -#include - -#include "db.h" -#include "table.h" -#include "task.h" - -/** This struct is sent with heartbeat messages from the local scheduler to the - * global scheduler, and it contains information about the load on the local - * scheduler. */ -typedef struct { - /** The total number of workers that are connected to this local scheduler. */ - int total_num_workers; - /** The number of tasks queued in this local scheduler. */ - int task_queue_length; - /** The number of workers that are available and waiting for tasks. */ - int available_workers; - /** The resource vector of resources generally available to this local - * scheduler. */ - std::unordered_map static_resources; - /** The resource vector of resources currently available to this local - * scheduler. 
*/ - std::unordered_map dynamic_resources; - /** Whether the local scheduler is dead. If true, then all other fields - * should be ignored. */ - bool is_dead; -} LocalSchedulerInfo; - -/* - * ==== Subscribing to the local scheduler table ==== - */ - -/* Callback for subscribing to the local scheduler table. */ -typedef void (*local_scheduler_table_subscribe_callback)( - DBClientID client_id, - LocalSchedulerInfo info, - void *user_context); - -/** - * Register a callback for a local scheduler table event. - * - * @param db_handle Database handle. - * @param subscribe_callback Callback that will be called when the local - * scheduler event happens. - * @param subscribe_context Context that will be passed into the - * subscribe_callback. - * @param retry Information about retrying the request to the database. - * @return Void. - */ -void local_scheduler_table_subscribe( - DBHandle *db_handle, - local_scheduler_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry); - -/* Data that is needed to register local scheduler table subscribe callbacks - * with the state database. */ -typedef struct { - local_scheduler_table_subscribe_callback subscribe_callback; - void *subscribe_context; -} LocalSchedulerTableSubscribeData; - -/** - * Send a heartbeat to all subscribers to the local scheduler table. This - * heartbeat contains some information about the load on the local scheduler. - * - * @param db_handle Database handle. - * @param info Information about the local scheduler, including the load on the - * local scheduler. - * @param retry Information about retrying the request to the database. - * @return Void. - */ -void local_scheduler_table_send_info(DBHandle *db_handle, - LocalSchedulerInfo *info, - RetryInfo *retry); - -/* Data that is needed to publish local scheduler heartbeats to the local - * scheduler table. */ -typedef struct { - /* The size of the flatbuffer object. */ - int64_t size; - /* The information to be sent. */ - uint8_t flatbuffer_data[0]; -} LocalSchedulerTableSendInfoData; - -/** - * Send a null heartbeat to all subscribers to the local scheduler table to - * notify them that we are about to exit. This operation is performed - * synchronously. - * - * @param db_handle Database handle. - * @return Void. 
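/* Illustrative sketch, not from the original sources; it depends on the
 * legacy local_scheduler_table.h deleted here. Publishing one heartbeat with
 * the load information described by LocalSchedulerInfo above. The resource
 * name and numbers are placeholders, and the NULL retry mirrors other callers
 * in these files (e.g. db_client_table_cache_init). */
void send_heartbeat_example(DBHandle *db) {
  LocalSchedulerInfo info;
  info.total_num_workers = 4;
  info.task_queue_length = 0;
  info.available_workers = 4;
  info.static_resources["CPU"] = 4.0;  /* Resources configured on this node. */
  info.dynamic_resources["CPU"] = 4.0; /* Resources currently free. */
  info.is_dead = false;
  local_scheduler_table_send_info(db, &info, NULL);
}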
- */ -void local_scheduler_table_disconnect(DBHandle *db_handle); - -#endif /* LOCAL_SCHEDULER_TABLE_H */ diff --git a/src/common/state/object_table.cc b/src/common/state/object_table.cc deleted file mode 100644 index fcd527e62f6a4..0000000000000 --- a/src/common/state/object_table.cc +++ /dev/null @@ -1,119 +0,0 @@ -#include "object_table.h" -#include "redis.h" - -void object_table_lookup(DBHandle *db_handle, - ObjectID object_id, - RetryInfo *retry, - object_table_lookup_done_callback done_callback, - void *user_context) { - RAY_CHECK(db_handle != NULL); - init_table_callback(db_handle, object_id, __func__, - new CommonCallbackData(NULL), retry, - (table_done_callback) done_callback, - redis_object_table_lookup, user_context); -} - -void object_table_add(DBHandle *db_handle, - ObjectID object_id, - int64_t object_size, - unsigned char digest[], - RetryInfo *retry, - object_table_done_callback done_callback, - void *user_context) { - RAY_CHECK(db_handle != NULL); - - ObjectTableAddData *info = - (ObjectTableAddData *) malloc(sizeof(ObjectTableAddData)); - info->object_size = object_size; - memcpy(&info->digest[0], digest, DIGEST_SIZE); - init_table_callback(db_handle, object_id, __func__, - new CommonCallbackData(info), retry, - (table_done_callback) done_callback, - redis_object_table_add, user_context); -} - -void object_table_remove(DBHandle *db_handle, - ObjectID object_id, - DBClientID *client_id, - RetryInfo *retry, - object_table_done_callback done_callback, - void *user_context) { - RAY_CHECK(db_handle != NULL); - /* Copy the client ID, if one was provided. */ - DBClientID *client_id_copy = NULL; - if (client_id != NULL) { - client_id_copy = (DBClientID *) malloc(sizeof(DBClientID)); - *client_id_copy = *client_id; - } - init_table_callback(db_handle, object_id, __func__, - new CommonCallbackData(client_id_copy), retry, - (table_done_callback) done_callback, - redis_object_table_remove, user_context); -} - -void object_table_subscribe_to_notifications( - DBHandle *db_handle, - bool subscribe_all, - object_table_object_available_callback object_available_callback, - void *subscribe_context, - RetryInfo *retry, - object_table_lookup_done_callback done_callback, - void *user_context) { - RAY_CHECK(db_handle != NULL); - ObjectTableSubscribeData *sub_data = - (ObjectTableSubscribeData *) malloc(sizeof(ObjectTableSubscribeData)); - sub_data->object_available_callback = object_available_callback; - sub_data->subscribe_context = subscribe_context; - sub_data->subscribe_all = subscribe_all; - - init_table_callback( - db_handle, ObjectID::nil(), __func__, new CommonCallbackData(sub_data), - retry, (table_done_callback) done_callback, - redis_object_table_subscribe_to_notifications, user_context); -} - -void object_table_request_notifications(DBHandle *db_handle, - int num_object_ids, - ObjectID object_ids[], - RetryInfo *retry) { - RAY_CHECK(db_handle != NULL); - RAY_CHECK(num_object_ids > 0); - ObjectTableRequestNotificationsData *data = - (ObjectTableRequestNotificationsData *) malloc( - sizeof(ObjectTableRequestNotificationsData) + - num_object_ids * sizeof(ObjectID)); - data->num_object_ids = num_object_ids; - memcpy(data->object_ids, object_ids, num_object_ids * sizeof(ObjectID)); - - init_table_callback(db_handle, ObjectID::nil(), __func__, - new CommonCallbackData(data), retry, NULL, - redis_object_table_request_notifications, NULL); -} - -void result_table_add(DBHandle *db_handle, - ObjectID object_id, - TaskID task_id, - bool is_put, - RetryInfo *retry, - result_table_done_callback 
done_callback, - void *user_context) { - ResultTableAddInfo *info = - (ResultTableAddInfo *) malloc(sizeof(ResultTableAddInfo)); - info->task_id = task_id; - info->is_put = is_put; - init_table_callback(db_handle, object_id, __func__, - new CommonCallbackData(info), retry, - (table_done_callback) done_callback, - redis_result_table_add, user_context); -} - -void result_table_lookup(DBHandle *db_handle, - ObjectID object_id, - RetryInfo *retry, - result_table_lookup_callback done_callback, - void *user_context) { - init_table_callback(db_handle, object_id, __func__, - new CommonCallbackData(NULL), retry, - (table_done_callback) done_callback, - redis_result_table_lookup, user_context); -} diff --git a/src/common/state/object_table.h b/src/common/state/object_table.h deleted file mode 100644 index 77a299dfd30a8..0000000000000 --- a/src/common/state/object_table.h +++ /dev/null @@ -1,242 +0,0 @@ -#ifndef OBJECT_TABLE_H -#define OBJECT_TABLE_H - -#include "common.h" -#include "table.h" -#include "db.h" -#include "task.h" - -/* - * ==== Lookup call and callback ==== - */ - -/* Callback called when the lookup completes. The callback should free - * the manager_vector array, but NOT the strings they are pointing to. If there - * was no entry at all for the object (the object had never been created - * before), then never_created will be true. - */ -typedef void (*object_table_lookup_done_callback)( - ObjectID object_id, - bool never_created, - const std::vector &manager_ids, - void *user_context); - -/* Callback called when object ObjectID is available. */ -typedef void (*object_table_object_available_callback)( - ObjectID object_id, - int64_t data_size, - const std::vector &manager_ids, - void *user_context); - -/** - * Return the list of nodes storing object_id in their plasma stores. - * - * @param db_handle Handle to object_table database. - * @param object_id ID of the object being looked up. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Context passed by the caller. - * @return Void. - */ -void object_table_lookup(DBHandle *db_handle, - ObjectID object_id, - RetryInfo *retry, - object_table_lookup_done_callback done_callback, - void *user_context); - -/* - * ==== Add object call and callback ==== - */ - -/** - * Callback called when the object add/remove operation completes. - * - * @param object_id The ID of the object that was added or removed. - * @param success Whether the operation was successful or not. If this is false - * and the operation was an addition, the object was added, but there - * was a hash mismatch. - * @param user_context The user context that was passed into the add/remove - * call. - */ -typedef void (*object_table_done_callback)(ObjectID object_id, - bool success, - void *user_context); - -/** - * Add the plasma manager that created the db_handle to the - * list of plasma managers that have the object_id. - * - * @param db_handle Handle to db. - * @param object_id Object unique identifier. - * @param data_size Object data size. - * @param retry Information about retrying the request to the database. - * @param done_callback Callback to be called when lookup completes. - * @param user_context User context to be passed in the callbacks. - * @return Void. 
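/* Illustrative sketch, not from the original sources; it is written against
 * the legacy object_table.h removed in this change. A lookup paired with its
 * done callback, following the object_table_lookup_done_callback typedef
 * above; the manager vector's element type is assumed to be DBClientID. */
void example_lookup_done(ObjectID object_id, bool never_created,
                         const std::vector<DBClientID> &manager_ids,
                         void *user_context) {
  if (never_created) {
    /* No entry was ever written for this object. */
    return;
  }
  /* manager_ids lists the plasma managers whose stores hold the object. */
}

void example_lookup(DBHandle *db, ObjectID object_id) {
  object_table_lookup(db, object_id, NULL, example_lookup_done, NULL);
}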
- */ -void object_table_add(DBHandle *db_handle, - ObjectID object_id, - int64_t object_size, - unsigned char digest[], - RetryInfo *retry, - object_table_done_callback done_callback, - void *user_context); - -/** Data that is needed to add new objects to the object table. */ -typedef struct { - int64_t object_size; - unsigned char digest[DIGEST_SIZE]; -} ObjectTableAddData; - -/* - * ==== Remove object call and callback ==== - */ - -/** - * Object remove function. - * - * @param db_handle Handle to db. - * @param object_id Object unique identifier. - * @param client_id A pointer to the database client ID to remove. If this is - * set to NULL, then the client ID associated with db_handle will be - * removed. - * @param retry Information about retrying the request to the database. - * @param done_callback Callback to be called when lookup completes. - * @param user_context User context to be passed in the callbacks. - * @return Void. - */ -void object_table_remove(DBHandle *db_handle, - ObjectID object_id, - DBClientID *client_id, - RetryInfo *retry, - object_table_done_callback done_callback, - void *user_context); - -/* - * ==== Subscribe to be announced when new object available ==== - */ - -/** - * Set up a client-specific channel for receiving notifications about available - * objects from the object table. The callback will be called once per - * notification received on this channel. - * - * @param db_handle Handle to db. - * @param object_available_callback Callback to be called when new object - * becomes available. - * @param subscribe_context Caller context which will be passed to the - * object_available_callback. - * @param retry Information about retrying the request to the database. - * @param done_callback Callback to be called when subscription is installed. - * This is only used for the tests. - * @param user_context User context to be passed into the done callback. This is - * only used for the tests. - * @return Void. - */ -void object_table_subscribe_to_notifications( - DBHandle *db_handle, - bool subscribe_all, - object_table_object_available_callback object_available_callback, - void *subscribe_context, - RetryInfo *retry, - object_table_lookup_done_callback done_callback, - void *user_context); - -/** - * Request notifications about the availability of some objects from the object - * table. The notifications will be published to this client's object - * notification channel, which was set up by the method - * object_table_subscribe_to_notifications. - * - * @param db_handle Handle to db. - * @param object_ids The object IDs to receive notifications about. - * @param retry Information about retrying the request to the database. - * @return Void. - */ -void object_table_request_notifications(DBHandle *db, - int num_object_ids, - ObjectID object_ids[], - RetryInfo *retry); - -/** Data that is needed to run object_request_notifications requests. */ -typedef struct { - /** The number of object IDs. */ - int num_object_ids; - /** This field is used to store a variable number of object IDs. */ - ObjectID object_ids[0]; -} ObjectTableRequestNotificationsData; - -/** Data that is needed to register new object available callbacks with the - * state database. */ -typedef struct { - bool subscribe_all; - object_table_object_available_callback object_available_callback; - void *subscribe_context; -} ObjectTableSubscribeData; - -/* - * ==== Result table ==== - */ - -/** - * Callback called when the add/remove operation for a result table entry - * completes. 
*/ -typedef void (*result_table_done_callback)(ObjectID object_id, - void *user_context); - -/** Information about a result table entry to add. */ -typedef struct { - /** The task ID of the task that created the requested object. */ - TaskID task_id; - /** True if the object was created through a put, and false if created by - * return value. */ - bool is_put; -} ResultTableAddInfo; - -/** - * Add information about a new object to the object table. This - * is immutable information like the ID of the task that - * created the object. - * - * @param db_handle Handle to object_table database. - * @param object_id ID of the object to add. - * @param task_id ID of the task that creates this object. - * @param is_put A boolean that is true if the object was created through a - * ray.put, and false if the object was created by return value. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Context passed by the caller. - * @return Void. - */ -void result_table_add(DBHandle *db_handle, - ObjectID object_id, - TaskID task_id, - bool is_put, - RetryInfo *retry, - result_table_done_callback done_callback, - void *user_context); - -/** Callback called when the result table lookup completes. */ -typedef void (*result_table_lookup_callback)(ObjectID object_id, - TaskID task_id, - bool is_put, - void *user_context); - -/** - * Lookup the task that created an object in the result table. The return value - * is the task ID. - * - * @param db_handle Handle to object_table database. - * @param object_id ID of the object to lookup. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Context passed by the caller. - * @return Void. - */ -void result_table_lookup(DBHandle *db_handle, - ObjectID object_id, - RetryInfo *retry, - result_table_lookup_callback done_callback, - void *user_context); - -#endif /* OBJECT_TABLE_H */ diff --git a/src/common/state/redis.cc b/src/common/state/redis.cc deleted file mode 100644 index 17a3c8ce2d3a5..0000000000000 --- a/src/common/state/redis.cc +++ /dev/null @@ -1,1692 +0,0 @@ -/* Redis implementation of the global state store */ - -#include -#include -#include -#include - -extern "C" { -/* Including hiredis here is necessary on Windows for typedefs used in ae.h. */ -#include "hiredis/hiredis.h" -#include "hiredis/adapters/ae.h" -} - -#include "common.h" -#include "db.h" -#include "db_client_table.h" -#include "actor_notification_table.h" -#include "driver_table.h" -#include "local_scheduler_table.h" -#include "object_table.h" -#include "task.h" -#include "task_table.h" -#include "error_table.h" -#include "event_loop.h" -#include "redis.h" -#include "io.h" -#include "net.h" - -#include "format/common_generated.h" - -#include "common_protocol.h" - -#ifndef _WIN32 -/* This function is actually not declared in standard POSIX, so declare it. */ -extern int usleep(useconds_t usec); -#endif - -#define CHECK_REDIS_CONNECT(CONTEXT_TYPE, context, M, ...) \ - do { \ - CONTEXT_TYPE *_context = (context); \ - if (!_context) { \ - RAY_LOG(FATAL) << "could not allocate redis context"; \ - } \ - if (_context->err) { \ - RAY_LOG(ERROR) << M; \ - LOG_REDIS_ERROR(_context, ""); \ - exit(-1); \ - } \ - } while (0) - -/** - * A header for callbacks of a single Redis asynchronous command. 
The user must - * pass in the table operation's timer ID as the asynchronous command's - * privdata field when executing the asynchronous command. The user must define - * variable names for DB and CB_DATA. After this piece of code runs, DB - * will hold a reference to the database handle, CB_DATA will hold a reference - * to the callback data for this table operation. The user must pass in the - * redisReply pointer as the REPLY argument. - * - * This header also short-circuits the entire callback if: (1) there was no - * reply from Redis, or (2) the callback data for this table operation was - * already removed, meaning that the operation was already marked as succeeded - * or failed. - */ -#define REDIS_CALLBACK_HEADER(DB, CB_DATA, REPLY) \ - if ((REPLY) == NULL) { \ - return; \ - } \ - DBHandle *DB = (DBHandle *) c->data; \ - TableCallbackData *CB_DATA = outstanding_callbacks_find((int64_t) privdata); \ - if (CB_DATA == NULL) { \ - /* the callback data structure has been \ - * already freed; just ignore this reply */ \ - return; \ - } \ - do { \ - } while (0) - -redisAsyncContext *get_redis_context(DBHandle *db, UniqueID id) { - /* NOTE: The hash function used here must match the one in - * PyObjectID_redis_shard_hash in src/common/lib/python/common_extension.cc. - * Changes to the hash function should only be made through - * std::hash in src/common/common.h */ - std::hash index; - return db->contexts[index(id) % db->contexts.size()]; -} - -redisAsyncContext *get_redis_subscribe_context(DBHandle *db, UniqueID id) { - std::hash index; - return db->subscribe_contexts[index(id) % db->subscribe_contexts.size()]; -} - -void get_redis_shards(redisContext *context, - std::vector &db_shards_addresses, - std::vector &db_shards_ports) { - /* Get the total number of Redis shards in the system. */ - int num_attempts = 0; - redisReply *reply = NULL; - while (num_attempts < RayConfig::instance().redis_db_connect_retries()) { - /* Try to read the number of Redis shards from the primary shard. If the - * entry is present, exit. */ - reply = (redisReply *) redisCommand(context, "GET NumRedisShards"); - if (reply->type != REDIS_REPLY_NIL) { - break; - } - - /* Sleep for a little, and try again if the entry isn't there yet. */ - freeReplyObject(reply); - usleep(RayConfig::instance().redis_db_connect_wait_milliseconds() * 1000); - num_attempts++; - continue; - } - RAY_CHECK(num_attempts < RayConfig::instance().redis_db_connect_retries()) - << "No entry found for NumRedisShards"; - RAY_CHECK(reply->type == REDIS_REPLY_STRING) - << "Expected string, found Redis type " << reply->type - << " for NumRedisShards"; - int num_redis_shards = atoi(reply->str); - RAY_CHECK(num_redis_shards >= 1) << "Expected at least one Redis shard, " - << "found " << num_redis_shards; - freeReplyObject(reply); - - /* Get the addresses of all of the Redis shards. */ - num_attempts = 0; - while (num_attempts < RayConfig::instance().redis_db_connect_retries()) { - /* Try to read the Redis shard locations from the primary shard. If we find - * that all of them are present, exit. */ - reply = (redisReply *) redisCommand(context, "LRANGE RedisShards 0 -1"); - if (static_cast(reply->elements) == num_redis_shards) { - break; - } - - /* Sleep for a little, and try again if not all Redis shard addresses have - * been added yet. 
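/* The shard-selection rule used by get_redis_context above, reduced to a
 * self-contained sketch: hash the ID with the same std::hash everywhere and
 * take it modulo the number of shard connections. std::string stands in for
 * the UniqueID type here; the real code hashes the ID bytes the same way the
 * Python extension does. */
#include <cstddef>
#include <functional>
#include <string>
#include <vector>

template <typename ContextT>
ContextT *example_pick_shard(const std::vector<ContextT *> &shards,
                             const std::string &id) {
  std::hash<std::string> hash_fn;
  return shards[hash_fn(id) % shards.size()];
}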
*/ - freeReplyObject(reply); - usleep(RayConfig::instance().redis_db_connect_wait_milliseconds() * 1000); - num_attempts++; - continue; - } - RAY_CHECK(num_attempts < RayConfig::instance().redis_db_connect_retries()) - << "Expected " << num_redis_shards << " Redis shard addresses, found " - << reply->elements; - - /* Parse the Redis shard addresses. */ - char db_shard_address[16]; - int db_shard_port; - for (size_t i = 0; i < reply->elements; ++i) { - /* Parse the shard addresses and ports. */ - RAY_CHECK(reply->element[i]->type == REDIS_REPLY_STRING); - RAY_CHECK(parse_ip_addr_port(reply->element[i]->str, db_shard_address, - &db_shard_port) == 0); - db_shards_addresses.push_back(std::string(db_shard_address)); - db_shards_ports.push_back(db_shard_port); - } - freeReplyObject(reply); -} - -void db_connect_shard(const std::string &db_address, - int db_port, - DBClientID client, - const char *client_type, - const char *node_ip_address, - const std::vector &args, - DBHandle *db, - redisAsyncContext **context_out, - redisAsyncContext **subscribe_context_out, - redisContext **sync_context_out) { - /* Synchronous connection for initial handshake */ - redisReply *reply; - int connection_attempts = 0; - redisContext *sync_context = redisConnect(db_address.c_str(), db_port); - while (sync_context == NULL || sync_context->err) { - if (connection_attempts >= - RayConfig::instance().redis_db_connect_retries()) { - break; - } - RAY_LOG(WARNING) << "Failed to connect to Redis, retrying."; - /* Sleep for a little. */ - usleep(RayConfig::instance().redis_db_connect_wait_milliseconds() * 1000); - sync_context = redisConnect(db_address.c_str(), db_port); - connection_attempts += 1; - } - CHECK_REDIS_CONNECT(redisContext, sync_context, - "could not establish synchronous connection to redis " - "%s:%d", - db_address.c_str(), db_port); - /* Configure Redis to generate keyspace notifications for list events. This - * should only need to be done once (by whoever started Redis), but since - * Redis may be started in multiple places (e.g., for testing or when starting - * processes by hand), it is easier to do it multiple times. */ - reply = (redisReply *) redisCommand(sync_context, - "CONFIG SET notify-keyspace-events Kl"); - RAY_CHECK(reply != NULL) << "db_connect failed on CONFIG SET"; - freeReplyObject(reply); - /* Also configure Redis to not run in protected mode, so clients on other - * hosts can connect to it. */ - reply = - (redisReply *) redisCommand(sync_context, "CONFIG SET protected-mode no"); - RAY_CHECK(reply != NULL) << "db_connect failed on CONFIG SET"; - freeReplyObject(reply); - - /* Construct the argument arrays for RAY.CONNECT. */ - int argc = args.size() + 4; - const char **argv = (const char **) malloc(sizeof(char *) * argc); - size_t *argvlen = (size_t *) malloc(sizeof(size_t) * argc); - /* Set the command name argument. */ - argv[0] = "RAY.CONNECT"; - argvlen[0] = strlen(argv[0]); - /* Set the client ID argument. */ - argv[1] = (char *) client.data(); - argvlen[1] = sizeof(client); - /* Set the node IP address argument. */ - argv[2] = node_ip_address; - argvlen[2] = strlen(node_ip_address); - /* Set the client type argument. */ - argv[3] = client_type; - argvlen[3] = strlen(client_type); - /* Set the remaining arguments. */ - for (size_t i = 0; i < args.size(); ++i) { - argv[4 + i] = args[i].c_str(); - argvlen[4 + i] = strlen(args[i].c_str()); - } - - /* Register this client with Redis. RAY.CONNECT is a custom Redis command that - * we've defined. 
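/* A condensed sketch of the argv/argvlen construction used for RAY.CONNECT
 * above. redisCommandArgv takes explicit lengths, which is what allows a raw
 * binary client ID to be passed next to ordinary C strings. The argument
 * values here are placeholders. */
#include <cstring>
#include <vector>
extern "C" {
#include "hiredis/hiredis.h"
}

redisReply *example_send_connect(redisContext *ctx,
                                 const char *client_id, size_t client_id_len,
                                 const char *node_ip, const char *client_type) {
  std::vector<const char *> argv = {"RAY.CONNECT", client_id, node_ip,
                                    client_type};
  std::vector<size_t> argvlen = {strlen(argv[0]), client_id_len,
                                 strlen(node_ip), strlen(client_type)};
  return (redisReply *) redisCommandArgv(ctx, (int) argv.size(), argv.data(),
                                         argvlen.data());
}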
*/ - reply = (redisReply *) redisCommandArgv(sync_context, argc, argv, argvlen); - RAY_CHECK(reply != NULL) << "db_connect failed on RAY.CONNECT"; - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " << reply->str; - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - freeReplyObject(reply); - free(argv); - free(argvlen); - - *sync_context_out = sync_context; - - /* Establish connection for control data. */ - redisAsyncContext *context = redisAsyncConnect(db_address.c_str(), db_port); - CHECK_REDIS_CONNECT(redisAsyncContext, context, - "could not establish asynchronous connection to redis " - "%s:%d", - db_address.c_str(), db_port); - context->data = (void *) db; - *context_out = context; - - /* Establish async connection for subscription. */ - redisAsyncContext *subscribe_context = - redisAsyncConnect(db_address.c_str(), db_port); - CHECK_REDIS_CONNECT(redisAsyncContext, subscribe_context, - "could not establish asynchronous subscription " - "connection to redis %s:%d", - db_address.c_str(), db_port); - subscribe_context->data = (void *) db; - *subscribe_context_out = subscribe_context; -} - -DBHandle *db_connect(const std::string &db_primary_address, - int db_primary_port, - const char *client_type, - const char *node_ip_address, - const std::vector &args) { - /* Check that the number of args is even. These args will be passed to the - * RAY.CONNECT Redis command, which takes arguments in pairs. */ - if (args.size() % 2 != 0) { - RAY_LOG(FATAL) << "The number of extra args must be divisible by two."; - } - - /* Create a client ID for this client. */ - DBClientID client = DBClientID::from_random(); - - DBHandle *db = new DBHandle(); - - db->client_type = strdup(client_type); - db->client = client; - - redisAsyncContext *context; - redisAsyncContext *subscribe_context; - redisContext *sync_context; - - /* Connect to the primary redis instance. */ - db_connect_shard(db_primary_address, db_primary_port, client, client_type, - node_ip_address, args, db, &context, &subscribe_context, - &sync_context); - db->context = context; - db->subscribe_context = subscribe_context; - db->sync_context = sync_context; - - /* Get the shard locations. */ - std::vector db_shards_addresses; - std::vector db_shards_ports; - get_redis_shards(db->sync_context, db_shards_addresses, db_shards_ports); - RAY_CHECK(db_shards_addresses.size() > 0) << "No Redis shards found"; - /* Connect to the shards. */ - for (size_t i = 0; i < db_shards_addresses.size(); ++i) { - db_connect_shard(db_shards_addresses[i], db_shards_ports[i], client, - client_type, node_ip_address, args, db, &context, - &subscribe_context, &sync_context); - db->contexts.push_back(context); - db->subscribe_contexts.push_back(subscribe_context); - redisFree(sync_context); - } - - return db; -} - -void DBHandle_free(DBHandle *db) { - /* Clean up the primary Redis connection state. */ - redisFree(db->sync_context); - redisAsyncFree(db->context); - redisAsyncFree(db->subscribe_context); - - /* Clean up the Redis shards. */ - RAY_CHECK(db->contexts.size() == db->subscribe_contexts.size()); - for (size_t i = 0; i < db->contexts.size(); ++i) { - redisAsyncFree(db->contexts[i]); - redisAsyncFree(db->subscribe_contexts[i]); - } - - free(db->client_type); - delete db; -} - -void db_disconnect(DBHandle *db) { - /* Notify others that this client is disconnecting from Redis. If a client of - * the same type on the same node wants to reconnect again, they must - * reconnect and get assigned a different client ID. 
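/* A sketch of the connection lifecycle implemented above, as a caller would
 * use it: db_connect reaches the primary shard, discovers the data shards via
 * NumRedisShards/RedisShards, and connects to each of them; db_attach (just
 * below) hooks the async contexts into the event loop; db_disconnect issues
 * RAY.DISCONNECT and frees the handle. The client type and the extra
 * key/value args here are placeholders; the args must come in pairs. */
#include <string>
#include <vector>
#include "db.h"

void example_connect(event_loop *loop) {
  std::vector<std::string> args = {"example_key", "example_value"};
  DBHandle *db = db_connect("127.0.0.1", 6379, "example_client", "127.0.0.1",
                            args);
  db_attach(db, loop, /*reattach=*/false);
  /* ... issue object/task/result table operations ... */
  db_disconnect(db);
}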
*/ - redisReply *reply = - (redisReply *) redisCommand(db->sync_context, "RAY.DISCONNECT %b", - db->client.data(), sizeof(db->client)); - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " << reply->str; - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - freeReplyObject(reply); - - DBHandle_free(db); -} - -void db_attach(DBHandle *db, event_loop *loop, bool reattach) { - db->loop = loop; - /* Attach primary redis instance to the event loop. */ - int err = redisAeAttach(loop, db->context); - /* If the database is reattached in the tests, redis normally gives - * an error which we can safely ignore. */ - if (!reattach) { - RAY_CHECK(err == REDIS_OK) << "failed to attach the event loop"; - } - err = redisAeAttach(loop, db->subscribe_context); - if (!reattach) { - RAY_CHECK(err == REDIS_OK) << "failed to attach the event loop"; - } - /* Attach other redis shards to the event loop. */ - RAY_CHECK(db->contexts.size() == db->subscribe_contexts.size()); - for (size_t i = 0; i < db->contexts.size(); ++i) { - int err = redisAeAttach(loop, db->contexts[i]); - /* If the database is reattached in the tests, redis normally gives - * an error which we can safely ignore. */ - if (!reattach) { - RAY_CHECK(err == REDIS_OK) << "failed to attach the event loop"; - } - err = redisAeAttach(loop, db->subscribe_contexts[i]); - if (!reattach) { - RAY_CHECK(err == REDIS_OK) << "failed to attach the event loop"; - } - } -} - -/* - * ==== object_table callbacks ==== - */ - -void redis_object_table_add_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - /* Do some minimal checking. */ - redisReply *reply = (redisReply *) r; - bool success = (strcmp(reply->str, "hash mismatch") != 0); - if (!success) { - /* If our object hash doesn't match the one recorded in the table, report - * the error back to the user and exit immediately. */ - RAY_LOG(WARNING) << "Found objects with different value but same object " - << "ID, most likely because a nondeterministic task was " - << "executed twice, either for reconstruction or for " - << "speculation."; - } else { - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " - << reply->str; - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - } - /* Call the done callback if there is one. */ - if (callback_data->done_callback != NULL) { - object_table_done_callback done_callback = - (object_table_done_callback) callback_data->done_callback; - done_callback(callback_data->id, success, callback_data->user_context); - } - /* Clean up the timer and callback. 
*/ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_object_table_add(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - - ObjectTableAddData *info = (ObjectTableAddData *) callback_data->data->Get(); - ObjectID obj_id = callback_data->id; - int64_t object_size = info->object_size; - unsigned char *digest = info->digest; - - redisAsyncContext *context = get_redis_context(db, obj_id); - - int status = redisAsyncCommand( - context, redis_object_table_add_callback, - (void *) callback_data->timer_id, "RAY.OBJECT_TABLE_ADD %b %lld %b %b", - obj_id.data(), sizeof(obj_id), (long long) object_size, digest, - (size_t) DIGEST_SIZE, db->client.data(), sizeof(db->client)); - - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "error in redis_object_table_add"); - } -} - -void redis_object_table_remove_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - /* Do some minimal checking. */ - redisReply *reply = (redisReply *) r; - if (strcmp(reply->str, "object not found") == 0) { - /* If our object entry was not in the table, it's probably a race - * condition with an object_table_add. */ - return; - } - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " << reply->str; - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - /* Call the done callback if there is one. */ - if (callback_data->done_callback != NULL) { - object_table_done_callback done_callback = - (object_table_done_callback) callback_data->done_callback; - done_callback(callback_data->id, true, callback_data->user_context); - } - /* Clean up the timer and callback. */ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_object_table_remove(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - - ObjectID obj_id = callback_data->id; - /* If the caller provided a manager ID to delete, use it. Otherwise, use our - * own client ID as the ID to delete. */ - DBClientID *client_id = (DBClientID *) callback_data->data->Get(); - if (client_id == NULL) { - client_id = &db->client; - } - - redisAsyncContext *context = get_redis_context(db, obj_id); - - int status = redisAsyncCommand( - context, redis_object_table_remove_callback, - (void *) callback_data->timer_id, "RAY.OBJECT_TABLE_REMOVE %b %b", - obj_id.data(), sizeof(obj_id), client_id->data(), sizeof(*client_id)); - - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "error in redis_object_table_remove"); - } -} - -void redis_object_table_lookup(TableCallbackData *callback_data) { - RAY_CHECK(callback_data); - DBHandle *db = callback_data->db_handle; - - ObjectID obj_id = callback_data->id; - - redisAsyncContext *context = get_redis_context(db, obj_id); - - int status = redisAsyncCommand(context, redis_object_table_lookup_callback, - (void *) callback_data->timer_id, - "RAY.OBJECT_TABLE_LOOKUP %b", obj_id.data(), - sizeof(obj_id)); - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "error in object_table lookup"); - } -} - -void redis_result_table_add_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - /* Check that the command succeeded. 
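/* The %b conversions in the table commands above each consume a
 * (pointer, length) pair, so fixed-size binary IDs can be embedded directly
 * in a command without escaping. A self-contained illustration with a
 * placeholder key and value: */
extern "C" {
#include "hiredis/async.h"
}

int example_async_set(redisAsyncContext *ctx, const void *key, size_t key_len,
                      const void *val, size_t val_len) {
  /* No reply callback and no privdata are needed for this fire-and-forget
   * example. */
  return redisAsyncCommand(ctx, NULL, NULL, "SET %b %b", key, key_len,
                           val, val_len);
}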
*/ - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " << reply->str; - RAY_CHECK(strncmp(reply->str, "OK", strlen("OK")) == 0) << "reply->str is " - << reply->str; - /* Call the done callback if there is one. */ - if (callback_data->done_callback) { - result_table_done_callback done_callback = - (result_table_done_callback) callback_data->done_callback; - done_callback(callback_data->id, callback_data->user_context); - } - destroy_timer_callback(db->loop, callback_data); -} - -void redis_result_table_add(TableCallbackData *callback_data) { - RAY_CHECK(callback_data); - DBHandle *db = callback_data->db_handle; - ObjectID id = callback_data->id; - ResultTableAddInfo *info = (ResultTableAddInfo *) callback_data->data->Get(); - int is_put = info->is_put ? 1 : 0; - - redisAsyncContext *context = get_redis_context(db, id); - - /* Add the result entry to the result table. */ - int status = - redisAsyncCommand(context, redis_result_table_add_callback, - (void *) callback_data->timer_id, - "RAY.RESULT_TABLE_ADD %b %b %d", id.data(), sizeof(id), - info->task_id.data(), sizeof(info->task_id), is_put); - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "Error in result table add"); - } -} - -/* This allocates a task which must be freed by the caller, unless the returned - * task is NULL. This is used by both redis_result_table_lookup_callback and - * redis_task_table_get_task_callback. */ -Task *parse_and_construct_task_from_redis_reply(redisReply *reply) { - Task *task = NULL; - if (reply->type == REDIS_REPLY_NIL) { - /* There is no task in the reply, so return NULL. */ - } else if (reply->type == REDIS_REPLY_STRING) { - /* The reply is a flatbuffer TaskReply object. Parse it and construct the - * task. */ - auto message = flatbuffers::GetRoot(reply->str); - TaskSpec *spec = (TaskSpec *) message->task_spec()->data(); - int64_t task_spec_size = message->task_spec()->size(); - auto execution_dependencies = - flatbuffers::GetRoot( - message->execution_dependencies()->data()); - task = Task_alloc( - spec, task_spec_size, static_cast(message->state()), - from_flatbuf(*message->local_scheduler_id()), - from_flatbuf(*execution_dependencies->execution_dependencies())); - } else { - RAY_LOG(FATAL) << "Unexpected reply type " << reply->type; - } - /* Return the task. If it is not NULL, then it must be freed by the caller. */ - return task; -} - -void redis_result_table_lookup_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type == REDIS_REPLY_NIL || reply->type == REDIS_REPLY_STRING) - << "Unexpected reply type " << reply->type << " in " - << "redis_result_table_lookup_callback"; - /* Parse the task from the reply. */ - TaskID result_id = TaskID::nil(); - bool is_put = false; - if (reply->type == REDIS_REPLY_STRING) { - auto message = flatbuffers::GetRoot(reply->str); - result_id = from_flatbuf(*message->task_id()); - is_put = message->is_put(); - } - - /* Call the done callback if there is one. */ - result_table_lookup_callback done_callback = - (result_table_lookup_callback) callback_data->done_callback; - if (done_callback != NULL) { - done_callback(callback_data->id, result_id, is_put, - callback_data->user_context); - } - /* Clean up timer and callback. 
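/* The reply-parsing pattern used by parse_and_construct_task_from_redis_reply
 * above, isolated: a string reply from the Redis module is treated as a
 * serialized flatbuffer and read in place with flatbuffers::GetRoot.
 * ExampleMessage stands in for the generated message types (e.g. the task
 * reply) from common_generated.h. */
#include "flatbuffers/flatbuffers.h"
extern "C" {
#include "hiredis/hiredis.h"
}

template <typename ExampleMessage>
const ExampleMessage *example_parse_reply(redisReply *reply) {
  if (reply == NULL || reply->type == REDIS_REPLY_NIL) {
    return NULL;  /* No entry found for this key. */
  }
  if (reply->type != REDIS_REPLY_STRING) {
    return NULL;  /* Unexpected reply type. */
  }
  /* The returned pointer aliases reply->str, so it must be consumed before
   * freeReplyObject(reply) is called. */
  return flatbuffers::GetRoot<ExampleMessage>(reply->str);
}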
*/ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_result_table_lookup(TableCallbackData *callback_data) { - RAY_CHECK(callback_data); - DBHandle *db = callback_data->db_handle; - ObjectID id = callback_data->id; - redisAsyncContext *context = get_redis_context(db, id); - int status = - redisAsyncCommand(context, redis_result_table_lookup_callback, - (void *) callback_data->timer_id, - "RAY.RESULT_TABLE_LOOKUP %b", id.data(), sizeof(id)); - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "Error in result table lookup"); - } -} - -DBClient redis_db_client_table_get(DBHandle *db, - const unsigned char *client_id, - size_t client_id_len) { - redisReply *reply = - (redisReply *) redisCommand(db->sync_context, "HGETALL %s%b", - DB_CLIENT_PREFIX, client_id, client_id_len); - RAY_CHECK(reply->type == REDIS_REPLY_ARRAY); - RAY_CHECK(reply->elements > 0); - DBClient db_client; - int num_fields = 0; - /* Parse the fields into a DBClient. */ - for (size_t j = 0; j < reply->elements; j = j + 2) { - const char *key = reply->element[j]->str; - const char *value = reply->element[j + 1]->str; - if (strcmp(key, "ray_client_id") == 0) { - memcpy(db_client.id.mutable_data(), value, sizeof(db_client.id)); - num_fields++; - } else if (strcmp(key, "client_type") == 0) { - db_client.client_type = std::string(value); - num_fields++; - } else if (strcmp(key, "manager_address") == 0) { - db_client.manager_address = std::string(value); - num_fields++; - } else if (strcmp(key, "deleted") == 0) { - bool is_deleted = atoi(value); - db_client.is_alive = !is_deleted; - num_fields++; - } - } - freeReplyObject(reply); - /* The client ID, type, and whether it is deleted are all - * mandatory fields. Auxiliary address is optional. */ - RAY_CHECK(num_fields >= 3); - return db_client; -} - -void redis_cache_set_db_client(DBHandle *db, DBClient client) { - db->db_client_cache[client.id] = client; -} - -/** - * Get an entry from the plasma manager table in redis. - * - * @param db The database handle. - * @param index The index of the plasma manager. - * @return The IP address and port of the manager. - */ -DBClient redis_cache_get_db_client(DBHandle *db, DBClientID db_client_id) { - auto it = db->db_client_cache.find(db_client_id); - if (it == db->db_client_cache.end()) { - DBClient db_client = redis_db_client_table_get(db, db_client_id.data(), - sizeof(db_client_id)); - db->db_client_cache[db_client_id] = db_client; - it = db->db_client_cache.find(db_client_id); - } - return it->second; -} - -void redis_object_table_lookup_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - RAY_LOG(DEBUG) << "Object table lookup callback"; - RAY_CHECK(reply->type == REDIS_REPLY_NIL || reply->type == REDIS_REPLY_ARRAY); - - object_table_lookup_done_callback done_callback = - (object_table_lookup_done_callback) callback_data->done_callback; - - ObjectID obj_id = callback_data->id; - - /* Parse the Redis reply. */ - if (reply->type == REDIS_REPLY_NIL) { - /* The object entry did not exist. */ - if (done_callback) { - done_callback(obj_id, true, std::vector(), - callback_data->user_context); - } - } else if (reply->type == REDIS_REPLY_ARRAY) { - /* Extract the manager IDs from the response into a vector. 
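/* HGETALL replies, as parsed by redis_db_client_table_get above, arrive as a
 * flat array alternating field name and value. A minimal self-contained walk
 * over such a reply: */
#include <cstdio>
extern "C" {
#include "hiredis/hiredis.h"
}

void example_print_hash(redisReply *reply) {
  if (reply == NULL || reply->type != REDIS_REPLY_ARRAY) {
    return;
  }
  for (size_t j = 0; j + 1 < reply->elements; j += 2) {
    printf("%s = %s\n", reply->element[j]->str, reply->element[j + 1]->str);
  }
}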
*/ - std::vector manager_ids; - - for (size_t j = 0; j < reply->elements; ++j) { - RAY_CHECK(reply->element[j]->type == REDIS_REPLY_STRING); - DBClientID manager_id; - memcpy(manager_id.mutable_data(), reply->element[j]->str, - sizeof(manager_id)); - manager_ids.push_back(manager_id); - } - - if (done_callback) { - done_callback(obj_id, false, manager_ids, callback_data->user_context); - } - } else { - RAY_LOG(FATAL) << "Unexpected reply type from object table lookup."; - } - - /* Clean up timer and callback. */ - destroy_timer_callback(db->loop, callback_data); -} - -void object_table_redis_subscribe_to_notifications_callback( - redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - /* Replies to the SUBSCRIBE command have 3 elements. There are two - * possibilities. Either the reply is the initial acknowledgment of the - * subscribe command, or it is a message. If it is the initial acknowledgment, - * then - * - reply->element[0]->str is "subscribe" - * - reply->element[1]->str is the name of the channel - * - reply->emement[2]->str is null. - * If it is an actual message, then - * - reply->element[0]->str is "message" - * - reply->element[1]->str is the name of the channel - * - reply->emement[2]->str is the contents of the message. - */ - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type == REDIS_REPLY_ARRAY); - RAY_CHECK(reply->elements == 3); - redisReply *message_type = reply->element[0]; - RAY_LOG(DEBUG) << "Object table subscribe to notifications callback, message" - << message_type->str; - - if (strcmp(message_type->str, "message") == 0) { - /* We received an object notification. Parse the payload. */ - auto message = flatbuffers::GetRoot( - reply->element[2]->str); - /* Extract the object ID. */ - ObjectID obj_id = from_flatbuf(*message->object_id()); - /* Extract the data size. */ - int64_t data_size = message->object_size(); - int manager_count = message->manager_ids()->size(); - - /* Extract the manager IDs from the response into a vector. */ - std::vector manager_ids; - for (int i = 0; i < manager_count; ++i) { - DBClientID manager_id = from_flatbuf(*message->manager_ids()->Get(i)); - manager_ids.push_back(manager_id); - } - - /* Call the subscribe callback. */ - ObjectTableSubscribeData *data = - (ObjectTableSubscribeData *) callback_data->data->Get(); - if (data->object_available_callback) { - data->object_available_callback(obj_id, data_size, manager_ids, - data->subscribe_context); - } - } else if (strcmp(message_type->str, "subscribe") == 0) { - /* The reply for the initial SUBSCRIBE command. */ - /* Call the done callback if there is one. This code path should only be - * used in the tests. */ - if (callback_data->done_callback != NULL) { - object_table_lookup_done_callback done_callback = - (object_table_lookup_done_callback) callback_data->done_callback; - done_callback(ray::UniqueID::nil(), false, std::vector(), - callback_data->user_context); - } - /* If the initial SUBSCRIBE was successful, clean up the timer, but don't - * destroy the callback data. */ - remove_timer_callback(db->loop, callback_data); - } else { - RAY_LOG(FATAL) << "Unexpected reply type from object table subscribe to " - << "notifications."; - } -} - -void redis_object_table_subscribe_to_notifications( - TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - /* The object channel prefix must match the value defined in - * src/common/redismodule/ray_redis_module.cc. 
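/* The dispatch performed by the subscription callbacks above, isolated: every
 * delivery on a subscribed connection is a three-element array whose first
 * element distinguishes the initial "subscribe" acknowledgment from an actual
 * "message", and whose last element carries the payload (null for the
 * acknowledgment). */
#include <cstring>
extern "C" {
#include "hiredis/hiredis.h"
}

void example_handle_subscribe_reply(redisReply *reply) {
  if (reply == NULL || reply->type != REDIS_REPLY_ARRAY ||
      reply->elements != 3) {
    return;
  }
  if (strcmp(reply->element[0]->str, "subscribe") == 0) {
    /* Initial acknowledgment; the payload element is null. */
  } else if (strcmp(reply->element[0]->str, "message") == 0) {
    const char *payload = reply->element[2]->str;
    /* Parse the payload (here, a flatbuffer) and invoke the user callback. */
    (void) payload;
  }
}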
*/ - const char *object_channel_prefix = "OC:"; - const char *object_channel_bcast = "BCAST"; - for (size_t i = 0; i < db->subscribe_contexts.size(); ++i) { - int status = REDIS_OK; - /* Subscribe to notifications from the object table. This uses the client ID - * as the channel name so this channel is specific to this client. - * TODO(rkn): - * The channel name should probably be the client ID with some prefix. */ - RAY_CHECK(callback_data->data->Get() != NULL) - << "Object table subscribe data passed as NULL."; - if (((ObjectTableSubscribeData *) (callback_data->data->Get())) - ->subscribe_all) { - /* Subscribe to the object broadcast channel. */ - status = redisAsyncCommand( - db->subscribe_contexts[i], - object_table_redis_subscribe_to_notifications_callback, - (void *) callback_data->timer_id, "SUBSCRIBE %s%s", - object_channel_prefix, object_channel_bcast); - } else { - status = redisAsyncCommand( - db->subscribe_contexts[i], - object_table_redis_subscribe_to_notifications_callback, - (void *) callback_data->timer_id, "SUBSCRIBE %s%b", - object_channel_prefix, db->client.data(), sizeof(db->client)); - } - - if ((status == REDIS_ERR) || db->subscribe_contexts[i]->err) { - LOG_REDIS_DEBUG(db->subscribe_contexts[i], - "error in redis_object_table_subscribe_to_notifications"); - } - } -} - -void redis_object_table_request_notifications_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - /* Do some minimal checking. */ - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " << reply->str; - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - RAY_CHECK(callback_data->done_callback == NULL); - /* Clean up the timer and callback. */ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_object_table_request_notifications( - TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - - ObjectTableRequestNotificationsData *request_data = - (ObjectTableRequestNotificationsData *) callback_data->data->Get(); - int num_object_ids = request_data->num_object_ids; - ObjectID *object_ids = request_data->object_ids; - - for (int i = 0; i < num_object_ids; ++i) { - redisAsyncContext *context = get_redis_context(db, object_ids[i]); - - /* Create the arguments for the Redis command. */ - int num_args = 1 + 1 + 1; - const char **argv = (const char **) malloc(sizeof(char *) * num_args); - size_t *argvlen = (size_t *) malloc(sizeof(size_t) * num_args); - /* Set the command name argument. */ - argv[0] = "RAY.OBJECT_TABLE_REQUEST_NOTIFICATIONS"; - argvlen[0] = strlen(argv[0]); - /* Set the client ID argument. */ - argv[1] = (char *) db->client.data(); - argvlen[1] = sizeof(db->client); - /* Set the object ID arguments. */ - argv[2] = (char *) object_ids[i].data(); - argvlen[2] = sizeof(object_ids[i]); - - int status = redisAsyncCommandArgv( - context, redis_object_table_request_notifications_callback, - (void *) callback_data->timer_id, num_args, argv, argvlen); - free(argv); - free(argvlen); - - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, - "error in redis_object_table_subscribe_to_notifications"); - } - } -} - -/* - * ==== task_table callbacks ==== - */ - -void redis_task_table_get_task_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - /* Parse the task from the reply. 
*/ - Task *task = parse_and_construct_task_from_redis_reply(reply); - /* Call the done callback if there is one. */ - task_table_get_callback done_callback = - (task_table_get_callback) callback_data->done_callback; - if (done_callback != NULL) { - done_callback(task, callback_data->user_context); - } - /* Free the task if it is not NULL. */ - if (task != NULL) { - Task_free(task); - } - - /* Clean up the timer and callback. */ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_task_table_get_task(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - RAY_CHECK(callback_data->data->Get() == NULL); - TaskID task_id = callback_data->id; - - redisAsyncContext *context = get_redis_context(db, task_id); - - int status = redisAsyncCommand(context, redis_task_table_get_task_callback, - (void *) callback_data->timer_id, - "RAY.TASK_TABLE_GET %b", task_id.data(), - sizeof(task_id)); - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "error in redis_task_table_get_task"); - } -} - -void redis_task_table_add_task_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - redisReply *reply = (redisReply *) r; - // If no subscribers received the message, call the failure callback. The - // caller should decide whether to retry the add. NOTE(swang): The caller - // should check whether the receiving subscriber is still alive in the - // db_client table before retrying the add. - if (reply->type == REDIS_REPLY_ERROR && - strcmp(reply->str, "No subscribers received message.") == 0) { - RAY_LOG(WARNING) << "No subscribers received the task_table_add message."; - if (callback_data->retry.fail_callback != NULL) { - callback_data->retry.fail_callback(callback_data->id, - callback_data->user_context, - callback_data->data->Get()); - } - } else { - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " - << reply->str; - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - /* Call the done callback if there is one. */ - if (callback_data->done_callback != NULL) { - task_table_done_callback done_callback = - (task_table_done_callback) callback_data->done_callback; - done_callback(callback_data->id, callback_data->user_context); - } - } - - /* Clean up the timer and callback. 
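/* The failure path above in outline: when the Redis module reports that no
 * subscriber received a published task, the table layer invokes the caller's
 * fail_callback from RetryInfo instead of the done callback, and the caller
 * decides whether to re-issue the add. The callback shape below is inferred
 * from the invocation above (id, user_context, user_data); the real typedef
 * lives in table headers that are not part of this diff. */
static void example_on_task_add_failed(TaskID task_id, void *user_context,
                                       void *user_data) {
  /* Only retry the add if the destination local scheduler is still listed as
   * alive in the db client table (see the NOTE above). */
}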
*/ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_task_table_add_task(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - Task *task = (Task *) callback_data->data->Get(); - RAY_CHECK(task != NULL) << "NULL task passed to redis_task_table_add_task."; - - TaskID task_id = Task_task_id(task); - DBClientID local_scheduler_id = Task_local_scheduler(task); - redisAsyncContext *context = get_redis_context(db, task_id); - int state = static_cast(Task_state(task)); - - TaskExecutionSpec *execution_spec = Task_task_execution_spec(task); - TaskSpec *spec = execution_spec->Spec(); - - flatbuffers::FlatBufferBuilder fbb; - auto execution_dependencies = CreateTaskExecutionDependencies( - fbb, to_flatbuf(fbb, execution_spec->ExecutionDependencies())); - fbb.Finish(execution_dependencies); - - int status = redisAsyncCommand( - context, redis_task_table_add_task_callback, - (void *) callback_data->timer_id, "RAY.TASK_TABLE_ADD %b %d %b %b %d %b", - task_id.data(), sizeof(task_id), state, local_scheduler_id.data(), - sizeof(local_scheduler_id), fbb.GetBufferPointer(), - (size_t) fbb.GetSize(), - static_cast(execution_spec->SpillbackCount()), spec, - execution_spec->SpecSize()); - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "error in redis_task_table_add_task"); - } -} - -void redis_task_table_update_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - redisReply *reply = (redisReply *) r; - // If no subscribers received the message, call the failure callback. The - // caller should decide whether to retry the update. NOTE(swang): Retrying a - // task table update can race with the liveness monitor. Do not retry the - // update unless the caller is sure that the receiving subscriber is still - // alive in the db_client table. - if (reply->type == REDIS_REPLY_ERROR) { - RAY_LOG(WARNING) << "task_table_update failed with " << reply->str; - if (callback_data->retry.fail_callback != NULL) { - callback_data->retry.fail_callback(callback_data->id, - callback_data->user_context, - callback_data->data->Get()); - } else { - RAY_LOG(FATAL) << "task_table_update failed and no fail_callback is set"; - } - } else { - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - - /* Call the done callback if there is one. */ - if (callback_data->done_callback != NULL) { - task_table_done_callback done_callback = - (task_table_done_callback) callback_data->done_callback; - done_callback(callback_data->id, callback_data->user_context); - } - } - - /* Clean up the timer and callback. 
*/ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_task_table_update(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - Task *task = (Task *) callback_data->data->Get(); - RAY_CHECK(task != NULL) << "NULL task passed to redis_task_table_update."; - - TaskID task_id = Task_task_id(task); - redisAsyncContext *context = get_redis_context(db, task_id); - DBClientID local_scheduler_id = Task_local_scheduler(task); - int state = static_cast(Task_state(task)); - - TaskExecutionSpec *execution_spec = Task_task_execution_spec(task); - flatbuffers::FlatBufferBuilder fbb; - auto execution_dependencies = CreateTaskExecutionDependencies( - fbb, to_flatbuf(fbb, execution_spec->ExecutionDependencies())); - fbb.Finish(execution_dependencies); - - int status = redisAsyncCommand( - context, redis_task_table_update_callback, - (void *) callback_data->timer_id, "RAY.TASK_TABLE_UPDATE %b %d %b %b %d", - task_id.data(), sizeof(task_id), state, local_scheduler_id.data(), - sizeof(local_scheduler_id), fbb.GetBufferPointer(), - (size_t) fbb.GetSize(), - static_cast(execution_spec->SpillbackCount())); - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "error in redis_task_table_update"); - } -} - -void redis_task_table_test_and_update_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - /* Parse the task from the reply. */ - Task *task = parse_and_construct_task_from_redis_reply(reply); - if (task == NULL) { - /* A NULL task means that the task was not in the task table. NOTE(swang): - * For normal tasks, this is not expected behavior, but actor tasks may be - * delayed when added to the task table if they are submitted to a local - * scheduler before it receives the notification that maps the actor to a - * local scheduler. */ - RAY_LOG(ERROR) << "No task found during task_table_test_and_update for " - << "task with ID " << callback_data->id; - return; - } - /* Determine whether the update happened. */ - auto message = flatbuffers::GetRoot(reply->str); - bool updated = message->updated(); - - /* Call the done callback if there is one. */ - task_table_test_and_update_callback done_callback = - (task_table_test_and_update_callback) callback_data->done_callback; - if (done_callback != NULL) { - done_callback(task, callback_data->user_context, updated); - } - /* Free the task if it is not NULL. */ - if (task != NULL) { - Task_free(task); - } - /* Clean up timer and callback. */ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_task_table_test_and_update(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - TaskID task_id = callback_data->id; - redisAsyncContext *context = get_redis_context(db, task_id); - TaskTableTestAndUpdateData *update_data = - (TaskTableTestAndUpdateData *) callback_data->data->Get(); - - int status; - /* If the test local scheduler ID is NIL, then ignore it. 
*/ - if (update_data->test_local_scheduler_id.is_nil()) { - status = redisAsyncCommand( - context, redis_task_table_test_and_update_callback, - (void *) callback_data->timer_id, - "RAY.TASK_TABLE_TEST_AND_UPDATE %b %d %d %b", task_id.data(), - sizeof(task_id), update_data->test_state_bitmask, - update_data->update_state, update_data->local_scheduler_id.data(), - sizeof(update_data->local_scheduler_id)); - } else { - status = redisAsyncCommand( - context, redis_task_table_test_and_update_callback, - (void *) callback_data->timer_id, - "RAY.TASK_TABLE_TEST_AND_UPDATE %b %d %d %b %b", task_id.data(), - sizeof(task_id), update_data->test_state_bitmask, - update_data->update_state, update_data->local_scheduler_id.data(), - sizeof(update_data->local_scheduler_id), - update_data->test_local_scheduler_id.data(), - sizeof(update_data->test_local_scheduler_id)); - } - - if ((status == REDIS_ERR) || context->err) { - LOG_REDIS_DEBUG(context, "error in redis_task_table_test_and_update"); - } -} - -void redis_task_table_subscribe_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - - RAY_CHECK(reply->type == REDIS_REPLY_ARRAY); - /* The number of elements is 3 for a reply to SUBSCRIBE, and 4 for a reply to - * PSUBSCRIBE. */ - RAY_CHECK(reply->elements == 3 || reply->elements == 4) - << "reply->elements is " << reply->elements; - /* The first element is the message type and the last entry is the payload. - * The middle one or middle two elements describe the channel that was - * published on. */ - redisReply *message_type = reply->element[0]; - redisReply *payload = reply->element[reply->elements - 1]; - if (strcmp(message_type->str, "message") == 0 || - strcmp(message_type->str, "pmessage") == 0) { - /* Handle a task table event. Parse the payload and call the callback. */ - auto message = flatbuffers::GetRoot(payload->str); - /* Extract the scheduling state. */ - TaskStatus state = static_cast(message->state()); - /* Extract the local scheduler ID. */ - DBClientID local_scheduler_id = - from_flatbuf(*message->local_scheduler_id()); - /* Extract the execution dependencies. */ - auto execution_dependencies = - flatbuffers::GetRoot( - message->execution_dependencies()->data()); - /* Extract the task spec. */ - TaskSpec *spec = (TaskSpec *) message->task_spec()->data(); - int64_t task_spec_size = message->task_spec()->size(); - /* Extract the spillback information. */ - int spillback_count = message->spillback_count(); - /* Create a task. */ - /* Allocate the task execution spec on the stack and use it to construct - * the task. - */ - TaskExecutionSpec execution_spec( - from_flatbuf(*execution_dependencies->execution_dependencies()), spec, - task_spec_size, spillback_count); - Task *task = Task_alloc(execution_spec, state, local_scheduler_id); - - /* Call the subscribe callback if there is one. */ - TaskTableSubscribeData *data = - (TaskTableSubscribeData *) callback_data->data->Get(); - if (data->subscribe_callback != NULL) { - data->subscribe_callback(task, data->subscribe_context); - } - Task_free(task); - } else if (strcmp(message_type->str, "subscribe") == 0 || - strcmp(message_type->str, "psubscribe") == 0) { - /* If this condition is true, we got the initial message that acknowledged - * the subscription. 
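/* The detail handled by redis_task_table_subscribe_callback above: SUBSCRIBE
 * deliveries have three elements while PSUBSCRIBE deliveries have four (the
 * extra one is the matched pattern), so the payload is always taken from the
 * last element rather than a fixed index. */
extern "C" {
#include "hiredis/hiredis.h"
}

redisReply *example_subscription_payload(redisReply *reply) {
  if (reply == NULL || reply->type != REDIS_REPLY_ARRAY ||
      reply->elements < 3) {
    return NULL;
  }
  /* element[0] is "message"/"pmessage" or the subscribe acknowledgment; the
   * payload, if any, is always the final element. */
  return reply->element[reply->elements - 1];
}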
*/ - if (callback_data->done_callback != NULL) { - task_table_done_callback done_callback = - (task_table_done_callback) callback_data->done_callback; - done_callback(callback_data->id, callback_data->user_context); - } - /* Note that we do not destroy the callback data yet because the - * subscription callback needs this data. */ - remove_timer_callback(db->loop, callback_data); - } else { - RAY_LOG(FATAL) << "Unexpected reply type from task table subscribe. " - << "Message type is " << message_type->str; - } -} - -void redis_task_table_subscribe(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - TaskTableSubscribeData *data = - (TaskTableSubscribeData *) callback_data->data->Get(); - /* TASK_CHANNEL_PREFIX is defined in ray_redis_module.cc and must be kept in - * sync with that file. */ - const char *TASK_CHANNEL_PREFIX = "TT:"; - /* In the new code path, subscriptions currently go through the - * primary redis shard. */ - for (auto subscribe_context : db->subscribe_contexts) { - int status; - if (data->local_scheduler_id.is_nil()) { - /* TODO(swang): Implement the state_filter by translating the bitmask into - * a Redis key-matching pattern. */ - status = redisAsyncCommand( - subscribe_context, redis_task_table_subscribe_callback, - (void *) callback_data->timer_id, "PSUBSCRIBE %s*:%d", - TASK_CHANNEL_PREFIX, data->state_filter); - } else { - DBClientID local_scheduler_id = data->local_scheduler_id; - status = redisAsyncCommand( - subscribe_context, redis_task_table_subscribe_callback, - (void *) callback_data->timer_id, "SUBSCRIBE %s%b:%d", - TASK_CHANNEL_PREFIX, (char *) local_scheduler_id.data(), - sizeof(local_scheduler_id), data->state_filter); - } - if ((status == REDIS_ERR) || subscribe_context->err) { - LOG_REDIS_DEBUG(subscribe_context, "error in redis_task_table_subscribe"); - } - } -} - -/* - * ==== db client table callbacks ==== - */ - -void redis_db_client_table_remove_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " << reply->str; - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - - /* Call the done callback if there is one. */ - db_client_table_done_callback done_callback = - (db_client_table_done_callback) callback_data->done_callback; - if (done_callback) { - done_callback(callback_data->id, callback_data->user_context); - } - /* Clean up the timer and callback. */ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_db_client_table_remove(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - int status = - redisAsyncCommand(db->context, redis_db_client_table_remove_callback, - (void *) callback_data->timer_id, "RAY.DISCONNECT %b", - callback_data->id.data(), sizeof(callback_data->id)); - if ((status == REDIS_ERR) || db->context->err) { - LOG_REDIS_DEBUG(db->context, "error in db_client_table_remove"); - } -} - -void redis_db_client_table_scan(DBHandle *db, - std::vector &db_clients) { - /* TODO(swang): Integrate this functionality with the Ray Redis module. To do - * this, we need the KEYS or SCAN command in Redis modules. */ - /* Get all the database client keys. */ - redisReply *reply = (redisReply *) redisCommand(db->sync_context, "KEYS %s*", - DB_CLIENT_PREFIX); - if (reply->type == REDIS_REPLY_NIL) { - return; - } - /* Get all the database client information. 
*/ - RAY_CHECK(reply->type == REDIS_REPLY_ARRAY); - for (size_t i = 0; i < reply->elements; ++i) { - /* Strip the database client table prefix. */ - unsigned char *key = (unsigned char *) reply->element[i]->str; - key += strlen(DB_CLIENT_PREFIX); - size_t key_len = reply->element[i]->len; - key_len -= strlen(DB_CLIENT_PREFIX); - /* Get the database client's information. */ - DBClient db_client = redis_db_client_table_get(db, key, key_len); - db_clients.push_back(db_client); - } - freeReplyObject(reply); -} - -void redis_db_client_table_subscribe_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - - RAY_CHECK(reply->type == REDIS_REPLY_ARRAY); - RAY_CHECK(reply->elements > 2); - /* First entry is message type, then possibly the regex we psubscribed to, - * then topic, then payload. */ - redisReply *payload = reply->element[reply->elements - 1]; - /* If this condition is true, we got the initial message that acknowledged the - * subscription. */ - if (payload->str == NULL) { - if (callback_data->done_callback) { - db_client_table_done_callback done_callback = - (db_client_table_done_callback) callback_data->done_callback; - done_callback(callback_data->id, callback_data->user_context); - } - /* Note that we do not destroy the callback data yet because the - * subscription callback needs this data. */ - remove_timer_callback(db->loop, callback_data); - - /* Get the current db client table entries, in case we missed notifications - * before the initial subscription. This must be done before we process any - * notifications from the subscription channel, so that we don't readd an - * entry that has already been deleted. */ - std::vector db_clients; - redis_db_client_table_scan(db, db_clients); - /* Call the subscription callback for all entries that we missed. */ - DBClientTableSubscribeData *data = - (DBClientTableSubscribeData *) callback_data->data->Get(); - for (auto db_client : db_clients) { - data->subscribe_callback(&db_client, data->subscribe_context); - } - return; - } - /* Otherwise, parse the payload and call the callback. */ - auto message = - flatbuffers::GetRoot(payload->str); - - /* Parse the client type and auxiliary address from the response. If there is - * only client type, then the update was a delete. */ - DBClient db_client; - db_client.id = from_flatbuf(*message->db_client_id()); - db_client.client_type = std::string(message->client_type()->data()); - db_client.manager_address = std::string(message->manager_address()->data()); - db_client.is_alive = message->is_insertion(); - - /* Call the subscription callback. 
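/* The ordering enforced by redis_db_client_table_subscribe_callback above, in
 * outline: on the initial acknowledgment, scan the existing db-client entries
 * and deliver them through the same callback before any live notifications
 * are processed, so clients added before the subscription are not missed.
 * This sketch reuses the internal helpers defined above and is not
 * standalone. */
#include <vector>

void example_on_initial_ack(DBHandle *db, DBClientTableSubscribeData *data) {
  std::vector<DBClient> existing;
  redis_db_client_table_scan(db, existing);  /* KEYS-based snapshot */
  for (auto &client : existing) {
    data->subscribe_callback(&client, data->subscribe_context);
  }
  /* Subsequent "message" deliveries are then handled incrementally. */
}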
*/ - DBClientTableSubscribeData *data = - (DBClientTableSubscribeData *) callback_data->data->Get(); - if (data->subscribe_callback) { - data->subscribe_callback(&db_client, data->subscribe_context); - } -} - -void redis_db_client_table_subscribe(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - int status = redisAsyncCommand( - db->subscribe_context, redis_db_client_table_subscribe_callback, - (void *) callback_data->timer_id, "SUBSCRIBE db_clients"); - if ((status == REDIS_ERR) || db->subscribe_context->err) { - LOG_REDIS_DEBUG(db->subscribe_context, - "error in db_client_table_register_callback"); - } -} - -void redis_local_scheduler_table_subscribe_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type == REDIS_REPLY_ARRAY); - RAY_CHECK(reply->elements == 3); - redisReply *message_type = reply->element[0]; - RAY_LOG(DEBUG) << "Local scheduler table subscribe callback, message " - << message_type->str; - - if (strcmp(message_type->str, "message") == 0) { - /* Handle a local scheduler heartbeat. Parse the payload and call the - * subscribe callback. */ - auto message = - flatbuffers::GetRoot(reply->element[2]->str); - - /* Extract the client ID. */ - DBClientID client_id = from_flatbuf(*message->db_client_id()); - /* Extract the fields of the local scheduler info struct. */ - LocalSchedulerInfo info; - if (message->is_dead()) { - /* If the local scheduler is dead, then ignore all other fields in the - * message. */ - info.is_dead = true; - } else { - /* If the local scheduler is alive, collect load information. */ - info.is_dead = false; - info.total_num_workers = message->total_num_workers(); - info.task_queue_length = message->task_queue_length(); - info.available_workers = message->available_workers(); - - info.static_resources = map_from_flatbuf(*message->static_resources()); - info.dynamic_resources = map_from_flatbuf(*message->dynamic_resources()); - } - - /* Call the subscribe callback. */ - LocalSchedulerTableSubscribeData *data = - (LocalSchedulerTableSubscribeData *) callback_data->data->Get(); - if (data->subscribe_callback) { - data->subscribe_callback(client_id, info, data->subscribe_context); - } - } else if (strcmp(message_type->str, "subscribe") == 0) { - /* The reply for the initial SUBSCRIBE command. */ - RAY_CHECK(callback_data->done_callback == NULL); - /* If the initial SUBSCRIBE was successful, clean up the timer, but don't - * destroy the callback data. 
*/ - remove_timer_callback(db->loop, callback_data); - - } else { - RAY_LOG(FATAL) << "Unexpected reply type from local scheduler subscribe."; - } -} - -void redis_local_scheduler_table_subscribe(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - int status = redisAsyncCommand( - db->subscribe_context, redis_local_scheduler_table_subscribe_callback, - (void *) callback_data->timer_id, "SUBSCRIBE local_schedulers"); - if ((status == REDIS_ERR) || db->subscribe_context->err) { - LOG_REDIS_DEBUG(db->subscribe_context, - "error in redis_local_scheduler_table_subscribe"); - } -} - -void redis_local_scheduler_table_send_info_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type == REDIS_REPLY_INTEGER); - RAY_LOG(DEBUG) << reply->integer << " subscribers received this publish."; - - RAY_CHECK(callback_data->done_callback == NULL); - /* Clean up the timer and callback. */ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_local_scheduler_table_send_info(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - LocalSchedulerTableSendInfoData *data = - (LocalSchedulerTableSendInfoData *) callback_data->data->Get(); - - int64_t size = data->size; - uint8_t *flatbuffer_data = data->flatbuffer_data; - - int status = redisAsyncCommand( - db->context, redis_local_scheduler_table_send_info_callback, - (void *) callback_data->timer_id, "PUBLISH local_schedulers %b", - flatbuffer_data, size); - if ((status == REDIS_ERR) || db->context->err) { - LOG_REDIS_DEBUG(db->context, - "error in redis_local_scheduler_table_send_info"); - } -} - -void redis_local_scheduler_table_disconnect(DBHandle *db) { - flatbuffers::FlatBufferBuilder fbb; - /* Create the flatbuffers message. */ - std::unordered_map empty_resource_map; - /* Most of the flatbuffer message fields don't matter here. Only the - * db_client_id and the is_dead field matter. */ - auto message = CreateLocalSchedulerInfoMessage( - fbb, to_flatbuf(fbb, db->client), 0, 0, 0, - map_to_flatbuf(fbb, empty_resource_map), - map_to_flatbuf(fbb, empty_resource_map), true); - fbb.Finish(message); - - redisReply *reply = (redisReply *) redisCommand( - db->sync_context, "PUBLISH local_schedulers %b", fbb.GetBufferPointer(), - (size_t) fbb.GetSize()); - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " << reply->str; - RAY_CHECK(reply->type == REDIS_REPLY_INTEGER); - RAY_LOG(DEBUG) << reply->integer << " subscribers received this publish."; - freeReplyObject(reply); -} - -void redis_driver_table_subscribe_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type == REDIS_REPLY_ARRAY); - RAY_CHECK(reply->elements == 3); - redisReply *message_type = reply->element[0]; - RAY_LOG(DEBUG) << "Driver table subscribe callback, message " - << message_type->str; - - if (strcmp(message_type->str, "message") == 0) { - /* Handle a driver heartbeat. Parse the payload and call the subscribe - * callback. */ - auto message = - flatbuffers::GetRoot(reply->element[2]->str); - /* Extract the client ID. */ - WorkerID driver_id = from_flatbuf(*message->driver_id()); - - /* Call the subscribe callback. 
*/ - DriverTableSubscribeData *data = - (DriverTableSubscribeData *) callback_data->data->Get(); - if (data->subscribe_callback) { - data->subscribe_callback(driver_id, data->subscribe_context); - } - } else if (strcmp(message_type->str, "subscribe") == 0) { - /* The reply for the initial SUBSCRIBE command. */ - RAY_CHECK(callback_data->done_callback == NULL); - /* If the initial SUBSCRIBE was successful, clean up the timer, but don't - * destroy the callback data. */ - remove_timer_callback(db->loop, callback_data); - - } else { - RAY_LOG(FATAL) << "Unexpected reply type from driver subscribe."; - } -} - -void redis_driver_table_subscribe(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - int status = redisAsyncCommand( - db->subscribe_context, redis_driver_table_subscribe_callback, - (void *) callback_data->timer_id, "SUBSCRIBE driver_deaths"); - if ((status == REDIS_ERR) || db->subscribe_context->err) { - LOG_REDIS_DEBUG(db->subscribe_context, - "error in redis_driver_table_subscribe"); - } -} - -void redis_driver_table_send_driver_death_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type == REDIS_REPLY_INTEGER); - RAY_LOG(DEBUG) << reply->integer << " subscribers received this publish."; - /* At the very least, the local scheduler that publishes this message should - * also receive it. */ - RAY_CHECK(reply->integer >= 1); - - RAY_CHECK(callback_data->done_callback == NULL); - /* Clean up the timer and callback. */ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_driver_table_send_driver_death(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - WorkerID driver_id = callback_data->id; - - /* Create a flatbuffer object to serialize and publish. */ - flatbuffers::FlatBufferBuilder fbb; - /* Create the flatbuffers message. */ - auto message = CreateDriverTableMessage(fbb, to_flatbuf(fbb, driver_id)); - fbb.Finish(message); - - int status = redisAsyncCommand( - db->context, redis_driver_table_send_driver_death_callback, - (void *) callback_data->timer_id, "PUBLISH driver_deaths %b", - fbb.GetBufferPointer(), (size_t) fbb.GetSize()); - if ((status == REDIS_ERR) || db->context->err) { - LOG_REDIS_DEBUG(db->context, - "error in redis_driver_table_send_driver_death"); - } -} - -void redis_plasma_manager_send_heartbeat(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - /* NOTE(swang): We purposefully do not provide a callback, leaving the table - * operation and timer active. This allows us to send a new heartbeat every - * heartbeat_timeout_milliseconds without having to allocate and deallocate - * memory for callback data each time. */ - int status = redisAsyncCommand( - db->context, NULL, (void *) callback_data->timer_id, - "PUBLISH plasma_managers %b", db->client.data(), sizeof(db->client)); - if ((status == REDIS_ERR) || db->context->err) { - LOG_REDIS_DEBUG(db->context, - "error in redis_plasma_manager_send_heartbeat"); - } - /* Clean up the timer and callback. 
*/ - destroy_timer_callback(db->loop, callback_data); -} - -void redis_publish_actor_creation_notification_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type == REDIS_REPLY_INTEGER); - RAY_LOG(DEBUG) << reply->integer << " subscribers received this publish."; - // At the very least, the local scheduler that publishes this message should - // also receive it. - RAY_CHECK(reply->integer >= 1); - - RAY_CHECK(callback_data->done_callback == NULL); - // Clean up the timer and callback. - destroy_timer_callback(db->loop, callback_data); -} - -void redis_publish_actor_creation_notification( - TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - - ActorCreationNotificationData *data = - (ActorCreationNotificationData *) callback_data->data->Get(); - - int status = redisAsyncCommand( - db->context, redis_publish_actor_creation_notification_callback, - (void *) callback_data->timer_id, "PUBLISH actor_notifications %b", - &data->flatbuffer_data[0], data->size); - if ((status == REDIS_ERR) || db->context->err) { - LOG_REDIS_DEBUG(db->context, - "error in redis_publish_actor_creation_notification"); - } -} - -void redis_actor_notification_table_subscribe_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - - redisReply *reply = (redisReply *) r; - RAY_CHECK(reply->type == REDIS_REPLY_ARRAY); - RAY_CHECK(reply->elements == 3); - redisReply *message_type = reply->element[0]; - RAY_LOG(DEBUG) << "Local scheduler table subscribe callback, message " - << message_type->str; - - if (strcmp(message_type->str, "message") == 0) { - // Handle an actor notification message. Parse the payload and call the - // subscribe callback. - redisReply *payload = reply->element[2]; - ActorNotificationTableSubscribeData *data = - (ActorNotificationTableSubscribeData *) callback_data->data->Get(); - - auto message = - flatbuffers::GetRoot(payload->str); - ActorID actor_id = from_flatbuf(*message->actor_id()); - WorkerID driver_id = from_flatbuf(*message->driver_id()); - DBClientID local_scheduler_id = - from_flatbuf(*message->local_scheduler_id()); - - if (data->subscribe_callback) { - data->subscribe_callback(actor_id, driver_id, local_scheduler_id, - data->subscribe_context); - } - } else if (strcmp(message_type->str, "subscribe") == 0) { - /* The reply for the initial SUBSCRIBE command. */ - RAY_CHECK(callback_data->done_callback == NULL); - /* If the initial SUBSCRIBE was successful, clean up the timer, but don't - * destroy the callback data. 
*/ - remove_timer_callback(db->loop, callback_data); - - } else { - RAY_LOG(FATAL) << "Unexpected reply type from actor notification " - << "subscribe."; - } -} - -void redis_actor_notification_table_subscribe( - TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - int status = redisAsyncCommand( - db->subscribe_context, redis_actor_notification_table_subscribe_callback, - (void *) callback_data->timer_id, "SUBSCRIBE actor_notifications"); - if ((status == REDIS_ERR) || db->subscribe_context->err) { - LOG_REDIS_DEBUG(db->subscribe_context, - "error in redis_actor_notification_table_subscribe"); - } -} - -void redis_actor_table_mark_removed(DBHandle *db, ActorID actor_id) { - int status = - redisAsyncCommand(db->context, NULL, NULL, "HSET Actor:%b removed \"1\"", - actor_id.data(), sizeof(actor_id)); - if ((status == REDIS_ERR) || db->subscribe_context->err) { - LOG_REDIS_DEBUG(db->context, "error in redis_actor_table_mark_removed"); - } -} - -void redis_push_error_rpush_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - /* The reply should be the length of the errors list after our RPUSH. */ - RAY_CHECK(reply->type == REDIS_REPLY_INTEGER); - destroy_timer_callback(db->loop, callback_data); -} - -void redis_push_error_hmset_callback(redisAsyncContext *c, - void *r, - void *privdata) { - REDIS_CALLBACK_HEADER(db, callback_data, r); - redisReply *reply = (redisReply *) r; - - /* Make sure we were able to add the error information. */ - RAY_CHECK(reply->type != REDIS_REPLY_ERROR) << "reply->str is " << reply->str; - RAY_CHECK(strcmp(reply->str, "OK") == 0) << "reply->str is " << reply->str; - - /* Add the error to this driver's list of errors. */ - ErrorInfo *info = (ErrorInfo *) callback_data->data->Get(); - int status = redisAsyncCommand( - db->context, redis_push_error_rpush_callback, - (void *) callback_data->timer_id, "RPUSH ErrorKeys Error:%b:%b", - info->driver_id.data(), sizeof(info->driver_id), info->error_key.data(), - sizeof(info->error_key)); - if ((status == REDIS_ERR) || db->subscribe_context->err) { - LOG_REDIS_DEBUG(db->subscribe_context, "error in redis_push_error rpush"); - } -} - -void redis_push_error(TableCallbackData *callback_data) { - DBHandle *db = callback_data->db_handle; - ErrorInfo *info = (ErrorInfo *) callback_data->data->Get(); - RAY_CHECK(info->error_type < ErrorIndex::MAX && - info->error_type >= ErrorIndex::OBJECT_HASH_MISMATCH); - /// Look up the error type. - const char *error_type = error_types[static_cast(info->error_type)]; - - /* Set the error information. 
*/ - int status = redisAsyncCommand( - db->context, redis_push_error_hmset_callback, - (void *) callback_data->timer_id, - "HMSET Error:%b:%b type %s message %b data %b", info->driver_id.data(), - sizeof(info->driver_id), info->error_key.data(), sizeof(info->error_key), - error_type, info->error_message, info->size, "None", strlen("None")); - if ((status == REDIS_ERR) || db->subscribe_context->err) { - LOG_REDIS_DEBUG(db->subscribe_context, "error in redis_push_error hmset"); - } -} - -DBClientID get_db_client_id(DBHandle *db) { - RAY_CHECK(db != NULL); - return db->client; -} diff --git a/src/common/state/redis.h b/src/common/state/redis.h deleted file mode 100644 index 164069740d3e1..0000000000000 --- a/src/common/state/redis.h +++ /dev/null @@ -1,356 +0,0 @@ -#ifndef REDIS_H -#define REDIS_H - -#include - -#include "db.h" -#include "db_client_table.h" -#include "object_table.h" -#include "task_table.h" - -#include "hiredis/hiredis.h" -#include "hiredis/async.h" - -#define LOG_REDIS_ERROR(context, M, ...) \ - RAY_LOG(ERROR) << "Redis error " << context->err << " " << context->errstr \ - << "; " << M - -#define LOG_REDIS_DEBUG(context, M, ...) \ - RAY_LOG(DEBUG) << "Redis error " << context->err << " " << context->errstr \ - << "; " << M; - -struct DBHandle { - /** String that identifies this client type. */ - char *client_type; - /** Unique ID for this client. */ - DBClientID client; - /** Primary redis context for all non-subscribe connections. This is used for - * the database client table, heartbeats, and errors that should be pushed to - * the driver. */ - redisAsyncContext *context; - /** Primary redis context for "subscribe" communication. A separate context - * is needed for this communication (see - * https://github.com/redis/hiredis/issues/55). This is used for the - * database client table, heartbeats, and errors that should be pushed to - * the driver. */ - redisAsyncContext *subscribe_context; - /** Redis contexts for shards for all non-subscribe connections. All requests - * to the object table, task table, and event table should be directed here. - * The correct shard can be retrieved using get_redis_context below. */ - std::vector contexts; - /** Redis contexts for shards for "subscribe" communication. All requests - * to the object table, task table, and event table should be directed here. - * The correct shard can be retrieved using get_redis_context below. */ - std::vector subscribe_contexts; - /** The event loop this global state store connection is part of. */ - event_loop *loop; - /** Index of the database connection in the event loop */ - int64_t db_index; - /** Cache for the IP addresses of db clients. This is an unordered map mapping - * client IDs to addresses. */ - std::unordered_map db_client_cache; - /** Redis context for synchronous connections. This should only be used very - * rarely, it is not asynchronous. */ - redisContext *sync_context; -}; - -/** - * Get the Redis asynchronous context responsible for non-subscription - * communication for the given UniqueID. - * - * @param db The database handle. - * @param id The ID whose location we are querying for. - * @return The redisAsyncContext responsible for the given ID. - */ -redisAsyncContext *get_redis_context(DBHandle *db, UniqueID id); - -/** - * Get the Redis asynchronous context responsible for subscription - * communication for the given UniqueID. - * - * @param db The database handle. - * @param id The ID whose location we are querying for. 
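// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: the redis_push_error
// chain above records an error in two steps -- HMSET the Error:<driver>:<key>
// hash, then, from the HMSET callback, RPUSH the key onto the driver's
// ErrorKeys list so drivers can discover it. The same two-step shape with
// plain strings standing in for the binary IDs; *_example names are placeholders.
#include <hiredis/async.h>

#include <cassert>

struct ErrorRecordExample {
  const char *driver_id;  // stands in for the binary DriverID
  const char *error_key;  // stands in for the binary error key
  const char *type;
  const char *message;
};

static void rpush_done_example(redisAsyncContext *c, void *r, void *privdata) {
  (void)c;
  (void)privdata;
  redisReply *reply = static_cast<redisReply *>(r);
  assert(reply != nullptr && reply->type == REDIS_REPLY_INTEGER);  // new list length
}

static void hmset_done_example(redisAsyncContext *c, void *r, void *privdata) {
  redisReply *reply = static_cast<redisReply *>(r);
  assert(reply != nullptr && reply->type != REDIS_REPLY_ERROR);
  auto *info = static_cast<ErrorRecordExample *>(privdata);
  // Step 2: index the error under the driver's list of error keys.
  int status = redisAsyncCommand(c, rpush_done_example, nullptr,
                                 "RPUSH ErrorKeys Error:%s:%s",
                                 info->driver_id, info->error_key);
  assert(status != REDIS_ERR);
}

void push_error_example(redisAsyncContext *context, ErrorRecordExample *info) {
  // Step 1: store the error fields in a hash keyed by driver ID and error key.
  int status = redisAsyncCommand(context, hmset_done_example, info,
                                 "HMSET Error:%s:%s type %s message %s",
                                 info->driver_id, info->error_key,
                                 info->type, info->message);
  assert(status != REDIS_ERR);
}
// ---------------------------------------------------------------------------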
- * @return The redisAsyncContext responsible for the given ID. - */ -redisAsyncContext *get_redis_subscribe_context(DBHandle *db, UniqueID id); - -/** - * Get a list of Redis shard IP addresses from the primary shard. - * - * @param context A Redis context connected to the primary shard. - * @param db_shards_addresses The IP addresses for the shards registered - * with the primary shard will be added to this vector. - * @param db_shards_ports The IP ports for the shards registered with the - * primary shard will be added to this vector, in the same order as - * db_shards_addresses. - */ -void get_redis_shards(redisContext *context, - std::vector &db_shards_addresses, - std::vector &db_shards_ports); - -void redis_cache_set_db_client(DBHandle *db, DBClient client); - -DBClient redis_cache_get_db_client(DBHandle *db, DBClientID db_client_id); - -void redis_object_table_get_entry(redisAsyncContext *c, - void *r, - void *privdata); - -void object_table_lookup_callback(redisAsyncContext *c, - void *r, - void *privdata); - -/* - * ==== Redis object table functions ==== - */ - -/** - * Lookup object table entry in redis. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_object_table_lookup(TableCallbackData *callback_data); - -/** - * Add a location entry to the object table in redis. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_object_table_add(TableCallbackData *callback_data); - -/** - * Remove a location entry from the object table in redis. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_object_table_remove(TableCallbackData *callback_data); - -/** - * Create a client-specific channel for receiving notifications from the object - * table. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_object_table_subscribe_to_notifications( - TableCallbackData *callback_data); - -/** - * Request notifications about when certain objects become available. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_object_table_request_notifications(TableCallbackData *callback_data); - -/** - * Add a new object to the object table in redis. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_result_table_add(TableCallbackData *callback_data); - -/** - * Lookup the task that created the object in redis. The result is the task ID. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_result_table_lookup(TableCallbackData *callback_data); - -/** - * Callback invoked when the reply from the object table lookup command is - * received. - * - * @param c Redis context. - * @param r Reply. - * @param privdata Data associated to the callback. - * @return Void. - */ -void redis_object_table_lookup_callback(redisAsyncContext *c, - void *r, - void *privdata); - -/* - * ==== Redis task table function ===== - */ - -/** - * Get a task table entry, including the task spec and the task's scheduling - * information. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. 
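// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: get_redis_context() and
// get_redis_subscribe_context(), declared above, map a UniqueID onto one of the
// per-shard hiredis contexts held in DBHandle. One plausible way to do that
// mapping -- hash a fixed-size prefix of the ID and take it modulo the shard
// count; the deleted implementation may have hashed differently.
#include <cstdint>
#include <cstring>
#include <vector>

struct redisAsyncContext;  // opaque here; defined in hiredis/async.h

template <typename IDType>
redisAsyncContext *pick_shard_context_example(
    const std::vector<redisAsyncContext *> &shard_contexts, const IDType &id) {
  uint64_t prefix = 0;
  // IDs are fixed-size byte strings (e.g. 20 bytes), so the first 8 bytes are
  // enough to spread keys across shards.
  std::memcpy(&prefix, id.data(), sizeof(prefix));
  return shard_contexts[prefix % shard_contexts.size()];
}
// ---------------------------------------------------------------------------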
- */ -void redis_task_table_get_task(TableCallbackData *callback_data); - -/** - * Add a task table entry with a new task spec and the task's scheduling - * information. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_task_table_add_task(TableCallbackData *callback_data); - -/** - * Update a task table entry with the task's scheduling information. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_task_table_update(TableCallbackData *callback_data); - -/** - * Update a task table entry with the task's scheduling information, if the - * task's current scheduling information matches the test value. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_task_table_test_and_update(TableCallbackData *callback_data); - -/** - * Callback invoked when the reply from the task push command is received. - * - * @param c Redis context. - * @param r Reply (not used). - * @param privdata Data associated to the callback. - * @return Void. - */ -void redis_task_table_publish_push_callback(redisAsyncContext *c, - void *r, - void *privdata); - -/** - * Callback invoked when the reply from the task publish command is received. - * - * @param c Redis context. - * @param r Reply (not used). - * @param privdata Data associated to the callback. - * @return Void. - */ -void redis_task_table_publish_publish_callback(redisAsyncContext *c, - void *r, - void *privdata); - -/** - * Subscribe to updates of the task table. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_task_table_subscribe(TableCallbackData *callback_data); - -/** - * Remove a client from the db clients table. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_db_client_table_remove(TableCallbackData *callback_data); - -/** - * Subscribe to updates from the db client table. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_db_client_table_subscribe(TableCallbackData *callback_data); - -/** - * Subscribe to updates from the local scheduler table. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_local_scheduler_table_subscribe(TableCallbackData *callback_data); - -/** - * Publish an update to the local scheduler table. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_local_scheduler_table_send_info(TableCallbackData *callback_data); - -/** - * Synchronously publish a null update to the local scheduler table signifying - * that we are about to exit. - * - * @param db The database handle of the dying local scheduler. - * @return Void. - */ -void redis_local_scheduler_table_disconnect(DBHandle *db); - -/** - * Subscribe to updates from the driver table. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_driver_table_subscribe(TableCallbackData *callback_data); - -/** - * Publish an update to the driver table. 
- * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_driver_table_send_driver_death(TableCallbackData *callback_data); - -void redis_plasma_manager_send_heartbeat(TableCallbackData *callback_data); - -/** - * Marks an actor as removed. This prevents the actor from being resurrected. - * - * @param db The database handle. - * @param actor_id The actor id to mark as removed. - * @return Void. - */ -void redis_actor_table_mark_removed(DBHandle *db, ActorID actor_id); - -/// Publish an actor creation notification. -/// -/// \param callback_data Data structure containing redis connection and timeout -/// information. -/// \return Void. -void redis_publish_actor_creation_notification( - TableCallbackData *callback_data); - -/** - * Subscribe to updates about newly created actors. - * - * @param callback_data Data structure containing redis connection and timeout - * information. - * @return Void. - */ -void redis_actor_notification_table_subscribe(TableCallbackData *callback_data); - -void redis_object_info_subscribe(TableCallbackData *callback_data); - -void redis_push_error(TableCallbackData *callback_data); - -#endif /* REDIS_H */ diff --git a/src/common/state/table.cc b/src/common/state/table.cc deleted file mode 100644 index 8269c2b1e7396..0000000000000 --- a/src/common/state/table.cc +++ /dev/null @@ -1,200 +0,0 @@ -#include "table.h" - -#include -#include -#include "redis.h" - -BaseCallbackData::BaseCallbackData(void *data) { - data_ = data; -} - -BaseCallbackData::~BaseCallbackData(void) {} - -void *BaseCallbackData::Get(void) { - return data_; -} - -CommonCallbackData::CommonCallbackData(void *data) : BaseCallbackData(data) {} - -CommonCallbackData::~CommonCallbackData(void) { - free(data_); -} - -TaskCallbackData::TaskCallbackData(Task *task_data) - : BaseCallbackData(task_data) {} - -TaskCallbackData::~TaskCallbackData(void) { - Task *task = (Task *) data_; - Task_free(task); -} - -/* The default behavior is to retry every ten seconds forever. */ -static const RetryInfo default_retry = {.num_retries = -1, - .timeout = 10000, - .fail_callback = NULL}; - -static int64_t callback_data_id = 0; - -TableCallbackData *init_table_callback(DBHandle *db_handle, - UniqueID id, - const char *label, - OWNER BaseCallbackData *data, - RetryInfo *retry, - table_done_callback done_callback, - table_retry_callback retry_callback, - void *user_context) { - RAY_CHECK(db_handle); - RAY_CHECK(db_handle->loop); - RAY_CHECK(data); - /* If no retry info is provided, use the default retry info. */ - if (retry == NULL) { - retry = (RetryInfo *) &default_retry; - } - RAY_CHECK(retry); - /* Allocate and initialize callback data structure for object table */ - TableCallbackData *callback_data = - (TableCallbackData *) malloc(sizeof(TableCallbackData)); - RAY_CHECK(callback_data != NULL) << "Memory allocation error!"; - callback_data->id = id; - callback_data->label = label; - callback_data->retry = *retry; - callback_data->done_callback = done_callback; - callback_data->retry_callback = retry_callback; - callback_data->data = data; - callback_data->requests_info = NULL; - callback_data->user_context = user_context; - callback_data->db_handle = db_handle; - /* TODO(ekl) set a retry timer once we've figured out the retry conditions - * and have a solution to the O(n^2) ae timers issue. For now, use a dummy - * timer id to uniquely id this callback. 
*/ - callback_data->timer_id = callback_data_id++; - outstanding_callbacks_add(callback_data); - - RAY_LOG(DEBUG) << "Initializing table command " << callback_data->label - << " with timer ID " << callback_data->timer_id; - callback_data->retry_callback(callback_data); - - return callback_data; -} - -void destroy_timer_callback(event_loop *loop, - TableCallbackData *callback_data) { - /* This is commented out because we no longer add timers to the event loop for - * each Redis command. */ - // event_loop_remove_timer(loop, callback_data->timer_id); - destroy_table_callback(callback_data); -} - -void remove_timer_callback(event_loop *loop, TableCallbackData *callback_data) { - /* This is commented out because we no longer add timers to the event loop for - * each Redis command. */ - // event_loop_remove_timer(loop, callback_data->timer_id); -} - -void destroy_table_callback(TableCallbackData *callback_data) { - RAY_CHECK(callback_data != NULL); - - if (callback_data->requests_info) - free(callback_data->requests_info); - - RAY_CHECK(callback_data->data != NULL); - delete callback_data->data; - callback_data->data = NULL; - - outstanding_callbacks_remove(callback_data); - - /* Timer is removed via EVENT_LOOP_TIMER_DONE in the timeout callback. */ - free(callback_data); -} - -int64_t table_timeout_handler(event_loop *loop, - int64_t timer_id, - void *user_context) { - RAY_CHECK(loop != NULL); - RAY_CHECK(user_context != NULL); - TableCallbackData *callback_data = (TableCallbackData *) user_context; - - RAY_CHECK(callback_data->retry.num_retries >= 0 || - callback_data->retry.num_retries == -1); - RAY_LOG(WARNING) << "retrying operation " << callback_data->label - << ", retry_count = " << callback_data->retry.num_retries; - - if (callback_data->retry.num_retries == 0) { - /* We didn't get a response from the database after exhausting all retries; - * let user know, cleanup the state, and remove the timer. */ - RAY_LOG(WARNING) << "Table command " << callback_data->label - << " with timer ID " << timer_id << " failed"; - if (callback_data->retry.fail_callback) { - callback_data->retry.fail_callback(callback_data->id, - callback_data->user_context, - callback_data->data->Get()); - } - destroy_table_callback(callback_data); - return EVENT_LOOP_TIMER_DONE; - } - - /* Decrement retry count and try again. We use -1 to indicate infinite - * retries. */ - if (callback_data->retry.num_retries != -1) { - callback_data->retry.num_retries--; - } - callback_data->retry_callback(callback_data); - return callback_data->retry.timeout; -} - -/** - * Unordered map maintaining the outstanding callbacks. - * - * This unordered map is used to handle the following case: - * - a table command is issued with an associated callback and a callback data - * structure; - * - the last timeout associated to this command expires, as a result the - * callback data structure is freed; - * - a reply arrives, but now the callback data structure is gone, so we have - * to ignore this reply; - * - * This unordered map enables us to ignore such replies. The operations on the - * unordered map are as follows. - * - * When we issue a table command and a timeout event to wait for the reply, we - * add a new entry to the unordered map that is keyed by the ID of the timer. - * Note that table commands must have unique timer IDs, which are assigned by - * the Redis ae event loop. - * - * When we receive the reply, we check whether the callback still exists in - * this unordered map, and if not we just ignore the reply. 
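// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: table_timeout_handler
// above encodes the retry policy -- num_retries == -1 retries forever, 0 gives
// up and calls fail_callback, anything else is decremented before the next
// attempt. The same decision logic in isolation; all names are placeholders.
#include <cstdint>
#include <functional>

struct RetrySketch {
  int num_retries;      // -1 means retry forever
  uint64_t timeout_ms;  // delay before the next attempt
};

// Returns 0 when the operation should be abandoned, otherwise the delay in
// milliseconds before the next retry (i.e. the value to rearm the timer with).
uint64_t next_retry_delay(RetrySketch &retry, const std::function<void()> &fail,
                          const std::function<void()> &attempt) {
  if (retry.num_retries == 0) {
    if (fail) fail();  // retries exhausted: report failure, stop the timer
    return 0;
  }
  if (retry.num_retries != -1) {
    retry.num_retries--;  // finite budget: consume one retry
  }
  attempt();                // reissue the command
  return retry.timeout_ms;  // keep the timer running
}
// ---------------------------------------------------------------------------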
If the callback does - * exist, the reply receiver is responsible for removing the timer and the - * entry associated to the callback, or else the timeout handler will continue - * firing. - * - * When the last timeout associated to the command expires we remove the entry - * associated to the callback. - */ -static std::unordered_map outstanding_callbacks; - -void outstanding_callbacks_add(TableCallbackData *callback_data) { - outstanding_callbacks[callback_data->timer_id] = callback_data; -} - -TableCallbackData *outstanding_callbacks_find(int64_t key) { - auto it = outstanding_callbacks.find(key); - if (it != outstanding_callbacks.end()) { - return it->second; - } - return NULL; -} - -void outstanding_callbacks_remove(TableCallbackData *callback_data) { - outstanding_callbacks.erase(callback_data->timer_id); -} - -void destroy_outstanding_callbacks(event_loop *loop) { - /* We have to be careful because destroy_timer_callback modifies - * outstanding_callbacks in place */ - auto it = outstanding_callbacks.begin(); - while (it != outstanding_callbacks.end()) { - auto next_it = std::next(it, 1); - destroy_timer_callback(loop, it->second); - it = next_it; - } -} diff --git a/src/common/state/table.h b/src/common/state/table.h deleted file mode 100644 index 1fadcf339cef3..0000000000000 --- a/src/common/state/table.h +++ /dev/null @@ -1,216 +0,0 @@ -#ifndef TABLE_H -#define TABLE_H - -#include "common.h" -#include "task.h" -#include "db.h" - -typedef struct TableCallbackData TableCallbackData; - -/* An abstract class for any data passed by the user into a table operation. - * This class wraps arbitrary pointers and allows the caller to define a custom - * destructor, for data that is not allocated with malloc. */ -class BaseCallbackData { - public: - BaseCallbackData(void *data); - virtual ~BaseCallbackData(void) = 0; - - /* Return the pointer to the data. */ - void *Get(void); - - protected: - /* The pointer to the data. */ - void *data_; -}; - -/* A common class for malloc'ed data passed by the user into a table operation. - * This should ONLY be used when only a free is necessary. */ -class CommonCallbackData : public BaseCallbackData { - public: - CommonCallbackData(void *data); - ~CommonCallbackData(void); -}; - -/* A class for Task data passed by the user into a table operation. This calls - * task cleanup in the destructor. */ -class TaskCallbackData : public BaseCallbackData { - public: - TaskCallbackData(Task *task_data); - ~TaskCallbackData(void); -}; - -typedef void *table_done_callback; - -/* The callback called when the database operation hasn't completed after - * the number of retries specified for the operation. - * - * @param id The unique ID that identifies this callback. Examples include an - * object ID or task ID. - * @param user_context The state context for the callback. This is equivalent - * to the user_context field in TableCallbackData. - * @param user_data A data argument for the callback. This is equivalent to the - * data field in TableCallbackData. The user is responsible for - * freeing user_data. - */ -typedef void (*table_fail_callback)(UniqueID id, - void *user_context, - void *user_data); - -typedef void (*table_retry_callback)(TableCallbackData *callback_data); - -/** - * Data structure consolidating the retry related variables. If a NULL - * RetryInfo struct is used, the default behavior will be to retry infinitely - * many times. - */ -typedef struct { - /** Number of retries. 
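// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: the outstanding-callbacks
// comment above describes the guard against late replies -- a reply handler
// first looks its timer ID up in the map and drops the reply if the entry was
// already destroyed by the timeout path. Reduced to a plain std::unordered_map;
// CallbackRecord and on_reply_example are placeholders.
#include <cstdint>
#include <unordered_map>

struct CallbackRecord {
  const char *label;
};

static std::unordered_map<int64_t, CallbackRecord *> outstanding_example;

void on_reply_example(int64_t timer_id) {
  auto it = outstanding_example.find(timer_id);
  if (it == outstanding_example.end()) {
    return;  // The command timed out and was cleaned up; ignore the stale reply.
  }
  CallbackRecord *record = it->second;
  (void)record;  // ... handle the reply here ...
  // Remove the entry so the timeout handler stops firing for this command.
  outstanding_example.erase(it);
}
// ---------------------------------------------------------------------------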
This field will be decremented every time a retry - * occurs (unless the value is -1). If this value is -1, then there will be - * infinitely many retries. */ - int num_retries; - /** Timeout, in milliseconds. */ - uint64_t timeout; - /** The callback that will be called if there are no more retries left. */ - table_fail_callback fail_callback; -} RetryInfo; - -struct TableCallbackData { - /** ID of the entry in the table that we are going to look up, remove or add. - */ - UniqueID id; - /** A label to identify the original request for logging purposes. */ - const char *label; - /** The callback that will be called when results is returned. */ - table_done_callback done_callback; - /** The callback that will be called to initiate the next try. */ - table_retry_callback retry_callback; - /** Retry information containing the remaining number of retries, the timeout - * before the next retry, and a pointer to the failure callback. - */ - RetryInfo retry; - /** Pointer to the data that is entered into the table. This can be used to - * pass the result of the call to the callback. The callback takes ownership - * over this data and will free it. */ - BaseCallbackData *data; - /** Pointer to the data used internally to handle multiple database requests. - */ - void *requests_info; - /** User context. */ - void *user_context; - /** Handle to db. */ - DBHandle *db_handle; - /** Handle to timer. */ - int64_t timer_id; -}; - -/** - * Function to handle the timeout event. - * - * @param loop Event loop. - * @param timer_id Timer identifier. - * @param context Pointer to the callback data for the object table - * @return Timeout to reset the timer if we need to try again, or - * EVENT_LOOP_TIMER_DONE if retry_count == 0. - */ -int64_t table_timeout_handler(event_loop *loop, - int64_t timer_id, - void *context); - -/** - * Initialize the table callback and call the retry_callback for the first time. - * - * @param db_handle Database handle. - * @param id ID of the object that is looked up, added or removed. - * @param label A string label to identify the type of table request for - * logging purposes. - * @param data Data entered into the table. Shall be freed by the user. Caller - * must specify a destructor by wrapping a void *pointer in a - * BaseCallbackData class. - * @param retry Retry relevant information: retry timeout, number of remaining - * retries, and retry callback. - * @param done_callback Function to be called when database returns result. - * @param fail_callback Function to be called when number of retries is - * exhausted. - * @param user_context Context that can be provided by the user and will be - * passed on to the various callbacks. - * @return New table callback data struct. - */ -TableCallbackData *init_table_callback(DBHandle *db_handle, - UniqueID id, - const char *label, - OWNER BaseCallbackData *data, - RetryInfo *retry, - table_done_callback done_callback, - table_retry_callback retry_callback, - void *user_context); - -/** - * Destroy any state associated with the callback data. This removes all - * associated state from the outstanding callbacks unordered map and frees any - * associated memory. This does not remove any associated timer events. - * - * @param callback_data The pointer to the data structure of the callback we - * want to remove. - * @return Void. - */ -void destroy_table_callback(TableCallbackData *callback_data); - -/** - * Destroy all state events associated with the callback data, including memory - * and timer events. 
- * - * @param loop The event loop. - * @param callback_data The pointer to the data structure of the callback we - * want to remove. - * @return Void. - */ -void destroy_timer_callback(event_loop *loop, TableCallbackData *callback_data); - -/** - * Remove the callback timer without destroying the callback data. - * - * @param loop The event loop. - * @param callback_data The pointer to the data structure of the callback. - * @return Void. - */ -void remove_timer_callback(event_loop *loop, TableCallbackData *callback_data); - -/** - * Add an outstanding callback entry. - * - * @param callback_data The pointer to the data structure of the callback we - * want to insert. - * @return None. - */ -void outstanding_callbacks_add(TableCallbackData *callback_data); - -/** - * Find an outstanding callback entry. - * - * @param key The key for the outstanding callbacks unordered map. We use the - * timer ID assigned by the Redis ae event loop. - * @return Returns the callback data if found, NULL otherwise. - */ -TableCallbackData *outstanding_callbacks_find(int64_t key); - -/** - * Remove an outstanding callback entry. This only removes the callback entry - * from the unordered map. It does not free the entry or remove any associated - * timer events. - * - * @param callback_data The pointer to the data structure of the callback we - * want to remove. - * @return Void. - */ -void outstanding_callbacks_remove(TableCallbackData *callback_data); - -/** - * Destroy all outstanding callbacks and remove their associated timer events - * from the event loop. - * - * @param loop The event loop from which we want to remove the timer events. - * @return Void. - */ -void destroy_outstanding_callbacks(event_loop *loop); - -#endif /* TABLE_H */ diff --git a/src/common/state/task_table.cc b/src/common/state/task_table.cc deleted file mode 100644 index 514350b08353c..0000000000000 --- a/src/common/state/task_table.cc +++ /dev/null @@ -1,80 +0,0 @@ -#include "task_table.h" -#include "redis.h" - -#define NUM_DB_REQUESTS 2 - -void task_table_get_task(DBHandle *db_handle, - TaskID task_id, - RetryInfo *retry, - task_table_get_callback get_callback, - void *user_context) { - init_table_callback( - db_handle, task_id, __func__, new CommonCallbackData(NULL), retry, - (void *) get_callback, redis_task_table_get_task, user_context); -} - -void task_table_add_task(DBHandle *db_handle, - OWNER Task *task, - RetryInfo *retry, - task_table_done_callback done_callback, - void *user_context) { - init_table_callback(db_handle, Task_task_id(task), __func__, - new TaskCallbackData(task), retry, - (table_done_callback) done_callback, - redis_task_table_add_task, user_context); -} - -void task_table_update(DBHandle *db_handle, - OWNER Task *task, - RetryInfo *retry, - task_table_done_callback done_callback, - void *user_context) { - init_table_callback(db_handle, Task_task_id(task), __func__, - new TaskCallbackData(task), retry, - (table_done_callback) done_callback, - redis_task_table_update, user_context); -} - -void task_table_test_and_update( - DBHandle *db_handle, - TaskID task_id, - DBClientID test_local_scheduler_id, - TaskStatus test_state_bitmask, - TaskStatus update_state, - RetryInfo *retry, - task_table_test_and_update_callback done_callback, - void *user_context) { - TaskTableTestAndUpdateData *update_data = - (TaskTableTestAndUpdateData *) malloc(sizeof(TaskTableTestAndUpdateData)); - update_data->test_local_scheduler_id = test_local_scheduler_id; - update_data->test_state_bitmask = test_state_bitmask; - 
update_data->update_state = update_state; - /* Update the task entry's local scheduler with this client's ID. */ - update_data->local_scheduler_id = db_handle->client; - init_table_callback(db_handle, task_id, __func__, - new CommonCallbackData(update_data), retry, - (table_done_callback) done_callback, - redis_task_table_test_and_update, user_context); -} - -/* TODO(swang): A corresponding task_table_unsubscribe. */ -void task_table_subscribe(DBHandle *db_handle, - DBClientID local_scheduler_id, - TaskStatus state_filter, - task_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry, - task_table_done_callback done_callback, - void *user_context) { - TaskTableSubscribeData *sub_data = - (TaskTableSubscribeData *) malloc(sizeof(TaskTableSubscribeData)); - sub_data->local_scheduler_id = local_scheduler_id; - sub_data->state_filter = state_filter; - sub_data->subscribe_callback = subscribe_callback; - sub_data->subscribe_context = subscribe_context; - - init_table_callback(db_handle, local_scheduler_id, __func__, - new CommonCallbackData(sub_data), retry, - (table_done_callback) done_callback, - redis_task_table_subscribe, user_context); -} diff --git a/src/common/state/task_table.h b/src/common/state/task_table.h deleted file mode 100644 index 3884ddece8931..0000000000000 --- a/src/common/state/task_table.h +++ /dev/null @@ -1,190 +0,0 @@ -#ifndef task_table_H -#define task_table_H - -#include "db.h" -#include "table.h" -#include "task.h" - -/** - * The task table is a message bus that is used for communication between local - * and global schedulers (and also persisted to the state database). Here are - * examples of events that are recorded by the task table: - * - * 1) Local schedulers write to it when submitting a task to the global - * scheduler. - * 2) The global scheduler subscribes to updates to the task table to get tasks - * submitted by local schedulers. - * 3) The global scheduler writes to it when assigning a task to a local - * scheduler. - * 4) Local schedulers subscribe to updates to the task table to get tasks - * assigned to them by the global scheduler. - * 5) Local schedulers write to it when a task finishes execution. - */ - -/* Callback called when a task table write operation completes. */ -typedef void (*task_table_done_callback)(TaskID task_id, void *user_context); - -/* Callback called when a task table read operation completes. If the task ID - * was not in the task table, then the task pointer will be NULL. */ -typedef void (*task_table_get_callback)(Task *task, void *user_context); - -/* Callback called when a task table test-and-update operation completes. If - * the task ID was not in the task table, then the task pointer will be NULL. - * If the update succeeded, the updated field will be set to true. */ -typedef void (*task_table_test_and_update_callback)(Task *task, - void *user_context, - bool updated); - -/** - * Get a task's entry from the task table. - * - * @param db_handle Database handle. - * @param task_id The ID of the task we want to look up. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Data that will be passed to done_callback and - * fail_callback. - * @return Void. 
- */ -void task_table_get_task(DBHandle *db, - TaskID task_id, - RetryInfo *retry, - task_table_get_callback get_callback, - void *user_context); - -/** - * Add a task entry, including task spec and scheduling information, to the task - * table. This will overwrite any task already in the task table with the same - * task ID. - * - * @param db_handle Database handle. - * @param task The task entry to add to the table. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Data that will be passed to done_callback and - * fail_callback. - * @return Void. - */ -void task_table_add_task(DBHandle *db_handle, - OWNER Task *task, - RetryInfo *retry, - task_table_done_callback done_callback, - void *user_context); - -/* - * ==== Publish the task table ==== - */ - -/** - * Update a task's scheduling information in the task table. This assumes that - * the task spec already exists in the task table entry. - * - * @param db_handle Database handle. - * @param task The task entry to add to the table. The task spec in the entry is - * ignored. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Data that will be passed to done_callback and - * fail_callback. - * @return Void. - */ -void task_table_update(DBHandle *db_handle, - OWNER Task *task, - RetryInfo *retry, - task_table_done_callback done_callback, - void *user_context); - -/** - * Update a task's scheduling information in the task table, if the current - * value matches the given test value. If the update succeeds, it also updates - * the task entry's local scheduler ID with the ID of the client who called - * this function. This assumes that the task spec already exists in the task - * table entry. - * - * @param db_handle Database handle. - * @param task_id The task ID of the task entry to update. - * @param test_local_scheduler_id The local scheduler ID to test the current - * local scheduler ID against. If not NIL_ID, and if the current local - * scheduler ID does not match it, then the update will not happen. - * @param test_state_bitmask The bitmask to apply to the task entry's current - * scheduling state. The update happens if and only if the current - * scheduling state AND-ed with the bitmask is greater than 0 and the - * local scheduler ID test passes. - * @param update_state The value to update the task entry's scheduling state - * with, if the current state matches test_state_bitmask. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Data that will be passed to done_callback and - * fail_callback. - * @return Void. - */ -void task_table_test_and_update( - DBHandle *db_handle, - TaskID task_id, - DBClientID test_local_scheduler_id, - TaskStatus test_state_bitmask, - TaskStatus update_state, - RetryInfo *retry, - task_table_test_and_update_callback done_callback, - void *user_context); - -/* Data that is needed to test and set the task's scheduling state. */ -typedef struct { - /** The value to test the current local scheduler ID against. This field is - * ignored if equal to NIL_ID. 
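// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: task_table_test_and_update,
// documented above, is a compare-and-swap on the task's scheduling state -- the
// update is applied only if the current state AND-ed with test_state_bitmask is
// non-zero (and the local scheduler ID test passes). The core check, reduced to
// plain integers; test_and_update_example is a placeholder name.
#include <cstdint>

// Returns true and writes update_state into *state when the bitmask test passes.
bool test_and_update_example(uint32_t *state, uint32_t test_state_bitmask,
                             uint32_t update_state) {
  if ((*state & test_state_bitmask) == 0) {
    return false;  // the current scheduling state does not match the test mask
  }
  *state = update_state;
  return true;
}
// ---------------------------------------------------------------------------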
*/ - DBClientID test_local_scheduler_id; - TaskStatus test_state_bitmask; - TaskStatus update_state; - DBClientID local_scheduler_id; -} TaskTableTestAndUpdateData; - -/* - * ==== Subscribing to the task table ==== - */ - -/* Callback for subscribing to the task table. */ -typedef void (*task_table_subscribe_callback)(Task *task, void *user_context); - -/** - * Register a callback for a task event. An event is any update of a task in - * the task table, produced by task_table_add_task or task_table_add_task. - * Events include changes to the task's scheduling state or changes to the - * task's local scheduler ID. - * - * @param db_handle Database handle. - * @param subscribe_callback Callback that will be called when the task table is - * updated. - * @param subscribe_context Context that will be passed into the - * subscribe_callback. - * @param local_scheduler_id The db_client_id of the local scheduler whose - * events we want to listen to. If you want to subscribe to updates from - * all local schedulers, pass in NIL_ID. - * @param state_filter Events we want to listen to. Can have values from the - * enum "scheduling_state" in task.h. - * TODO(pcm): Make it possible to combine these using flags like - * TASK_STATUS_WAITING | TASK_STATUS_SCHEDULED. - * @param retry Information about retrying the request to the database. - * @param done_callback Function to be called when database returns result. - * @param user_context Data that will be passed to done_callback and - * fail_callback. - * @return Void. - */ -void task_table_subscribe(DBHandle *db_handle, - DBClientID local_scheduler_id, - TaskStatus state_filter, - task_table_subscribe_callback subscribe_callback, - void *subscribe_context, - RetryInfo *retry, - task_table_done_callback done_callback, - void *user_context); - -/* Data that is needed to register task table subscribe callbacks with the state - * database. */ -typedef struct { - DBClientID local_scheduler_id; - TaskStatus state_filter; - task_table_subscribe_callback subscribe_callback; - void *subscribe_context; -} TaskTableSubscribeData; - -#endif /* task_table_H */ diff --git a/src/common/task.cc b/src/common/task.cc deleted file mode 100644 index 60110fe225432..0000000000000 --- a/src/common/task.cc +++ /dev/null @@ -1,606 +0,0 @@ -#include - -#include "common_protocol.h" - -#include "task.h" - -extern "C" { -#include "sha256.h" -} - -ObjectID task_compute_return_id(TaskID task_id, int64_t return_index) { - /* Here, return_indices need to be >= 0, so we can use negative - * indices for put. */ - RAY_DCHECK(return_index >= 0); - /* TODO(rkn): This line requires object and task IDs to be the same size. */ - ObjectID return_id = task_id; - int64_t *first_bytes = (int64_t *) &return_id; - /* XOR the first bytes of the object ID with the return index. We add one so - * the first return ID is not the same as the task ID. */ - *first_bytes = *first_bytes ^ (return_index + 1); - return return_id; -} - -ObjectID task_compute_put_id(TaskID task_id, int64_t put_index) { - RAY_DCHECK(put_index >= 0); - /* TODO(pcm): This line requires object and task IDs to be the same size. */ - ObjectID put_id = task_id; - int64_t *first_bytes = (int64_t *) &put_id; - /* XOR the first bytes of the object ID with the return index. We add one so - * the first return ID is not the same as the task ID. 
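// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: TaskTableSubscribeData
// above (filled in by task_table_subscribe in the .cc hunk earlier) is the
// usual C trampoline -- the caller's function pointer and context are packed
// into a heap-allocated struct that rides along with the table request until
// the subscription fires. Reduced version; the *_example names are placeholders.
#include <cstdlib>

typedef void (*subscribe_cb_example)(int event, void *user_context);

struct SubscribeDataExample {
  subscribe_cb_example callback;
  void *context;
};

SubscribeDataExample *pack_subscription_example(subscribe_cb_example cb, void *ctx) {
  auto *data =
      static_cast<SubscribeDataExample *>(std::malloc(sizeof(SubscribeDataExample)));
  data->callback = cb;
  data->context = ctx;
  return data;  // in the deleted code, CommonCallbackData frees this on cleanup
}

void fire_subscription_example(SubscribeDataExample *data, int event) {
  if (data->callback != nullptr) {
    data->callback(event, data->context);
  }
}
// ---------------------------------------------------------------------------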
*/ - *first_bytes = *first_bytes ^ (-put_index - 1); - return put_id; -} - -class TaskBuilder { - public: - void Start(UniqueID driver_id, - TaskID parent_task_id, - int64_t parent_counter, - ActorID actor_creation_id, - ObjectID actor_creation_dummy_object_id, - ActorID actor_id, - ActorHandleID actor_handle_id, - int64_t actor_counter, - bool is_actor_checkpoint_method, - FunctionID function_id, - int64_t num_returns) { - driver_id_ = driver_id; - parent_task_id_ = parent_task_id; - parent_counter_ = parent_counter; - actor_creation_id_ = actor_creation_id; - actor_creation_dummy_object_id_ = actor_creation_dummy_object_id; - actor_id_ = actor_id; - actor_handle_id_ = actor_handle_id; - actor_counter_ = actor_counter; - is_actor_checkpoint_method_ = is_actor_checkpoint_method; - function_id_ = function_id; - num_returns_ = num_returns; - - /* Compute hashes. */ - sha256_init(&ctx); - sha256_update(&ctx, (BYTE *) &driver_id, sizeof(driver_id)); - sha256_update(&ctx, (BYTE *) &parent_task_id, sizeof(parent_task_id)); - sha256_update(&ctx, (BYTE *) &parent_counter, sizeof(parent_counter)); - sha256_update(&ctx, (BYTE *) &actor_creation_id, sizeof(actor_creation_id)); - sha256_update(&ctx, (BYTE *) &actor_creation_dummy_object_id, - sizeof(actor_creation_dummy_object_id)); - sha256_update(&ctx, (BYTE *) &actor_id, sizeof(actor_id)); - sha256_update(&ctx, (BYTE *) &actor_counter, sizeof(actor_counter)); - sha256_update(&ctx, (BYTE *) &is_actor_checkpoint_method, - sizeof(is_actor_checkpoint_method)); - sha256_update(&ctx, (BYTE *) &function_id, sizeof(function_id)); - } - - void NextReferenceArgument(ObjectID object_ids[], int num_object_ids) { - args.push_back( - CreateArg(fbb, to_flatbuf(fbb, &object_ids[0], num_object_ids))); - sha256_update(&ctx, (BYTE *) &object_ids[0], - sizeof(object_ids[0]) * num_object_ids); - } - - void NextValueArgument(uint8_t *value, int64_t length) { - auto arg = fbb.CreateString((const char *) value, length); - auto empty_ids = fbb.CreateVectorOfStrings({}); - args.push_back(CreateArg(fbb, empty_ids, arg)); - sha256_update(&ctx, (BYTE *) value, length); - } - - void SetRequiredResource(const std::string &resource_name, double value) { - RAY_CHECK(resource_map_.count(resource_name) == 0); - resource_map_[resource_name] = value; - } - - uint8_t *Finish(int64_t *size) { - /* Add arguments. */ - auto arguments = fbb.CreateVector(args); - /* Update hash. */ - BYTE buff[DIGEST_SIZE]; - sha256_final(&ctx, buff); - TaskID task_id; - RAY_CHECK(sizeof(task_id) <= DIGEST_SIZE); - memcpy(&task_id, buff, sizeof(task_id)); - /* Add return object IDs. */ - std::vector> returns; - for (int64_t i = 0; i < num_returns_; i++) { - ObjectID return_id = task_compute_return_id(task_id, i); - returns.push_back(to_flatbuf(fbb, return_id)); - } - /* Create TaskInfo. */ - auto message = CreateTaskInfo( - fbb, to_flatbuf(fbb, driver_id_), to_flatbuf(fbb, task_id), - to_flatbuf(fbb, parent_task_id_), parent_counter_, - to_flatbuf(fbb, actor_creation_id_), - to_flatbuf(fbb, actor_creation_dummy_object_id_), - to_flatbuf(fbb, actor_id_), to_flatbuf(fbb, actor_handle_id_), - actor_counter_, is_actor_checkpoint_method_, - to_flatbuf(fbb, function_id_), arguments, fbb.CreateVector(returns), - map_to_flatbuf(fbb, resource_map_)); - /* Finish the TaskInfo. 
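// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: task_compute_return_id
// and task_compute_put_id above derive per-object IDs by XOR-ing the first
// eight bytes of the task ID with (return_index + 1) and (-put_index - 1), so
// return objects, put objects, and the task ID itself never collide. A toy
// check of that property on a fake 20-byte ID.
#include <array>
#include <cassert>
#include <cstdint>
#include <cstring>

using FakeID = std::array<uint8_t, 20>;

static FakeID xor_prefix(FakeID id, int64_t value) {
  int64_t prefix;
  std::memcpy(&prefix, id.data(), sizeof(prefix));
  prefix ^= value;
  std::memcpy(id.data(), &prefix, sizeof(prefix));
  return id;
}

int main() {
  FakeID task_id{};                             // all zeros, for the demo only
  FakeID return0 = xor_prefix(task_id, 0 + 1);  // first return object
  FakeID put0 = xor_prefix(task_id, -0 - 1);    // first put object
  assert(return0 != task_id && put0 != task_id && return0 != put0);
  return 0;
}
// ---------------------------------------------------------------------------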
*/ - fbb.Finish(message); - *size = fbb.GetSize(); - uint8_t *result = (uint8_t *) malloc(*size); - memcpy(result, fbb.GetBufferPointer(), *size); - fbb.Clear(); - args.clear(); - resource_map_.clear(); - return result; - } - - private: - flatbuffers::FlatBufferBuilder fbb; - std::vector> args; - SHA256_CTX ctx; - - /* Data for the builder. */ - UniqueID driver_id_; - TaskID parent_task_id_; - int64_t parent_counter_; - ActorID actor_creation_id_; - ObjectID actor_creation_dummy_object_id_; - ActorID actor_id_; - ActorID actor_handle_id_; - int64_t actor_counter_; - bool is_actor_checkpoint_method_; - FunctionID function_id_; - int64_t num_returns_; - std::unordered_map resource_map_; -}; - -TaskBuilder *make_task_builder(void) { - return new TaskBuilder(); -} - -void free_task_builder(TaskBuilder *builder) { - delete builder; -} - -bool TaskID_equal(TaskID first_id, TaskID second_id) { - return first_id == second_id; -} - -bool TaskID_is_nil(TaskID id) { - return id.is_nil(); -} - -bool ActorID_equal(ActorID first_id, ActorID second_id) { - return first_id == second_id; -} - -bool FunctionID_equal(FunctionID first_id, FunctionID second_id) { - return first_id == second_id; -} - -bool FunctionID_is_nil(FunctionID id) { - return id.is_nil(); -} - -/* Functions for building tasks. */ - -void TaskSpec_start_construct(TaskBuilder *builder, - UniqueID driver_id, - TaskID parent_task_id, - int64_t parent_counter, - ActorID actor_creation_id, - ObjectID actor_creation_dummy_object_id, - ActorID actor_id, - ActorID actor_handle_id, - int64_t actor_counter, - bool is_actor_checkpoint_method, - FunctionID function_id, - int64_t num_returns) { - builder->Start(driver_id, parent_task_id, parent_counter, actor_creation_id, - actor_creation_dummy_object_id, actor_id, actor_handle_id, - actor_counter, is_actor_checkpoint_method, function_id, - num_returns); -} - -TaskSpec *TaskSpec_finish_construct(TaskBuilder *builder, int64_t *size) { - return reinterpret_cast(builder->Finish(size)); -} - -void TaskSpec_args_add_ref(TaskBuilder *builder, - ObjectID object_ids[], - int num_object_ids) { - builder->NextReferenceArgument(&object_ids[0], num_object_ids); -} - -void TaskSpec_args_add_val(TaskBuilder *builder, - uint8_t *value, - int64_t length) { - builder->NextValueArgument(value, length); -} - -void TaskSpec_set_required_resource(TaskBuilder *builder, - const std::string &resource_name, - double value) { - builder->SetRequiredResource(resource_name, value); -} - -/* Functions for reading tasks. 
*/ - -TaskID TaskSpec_task_id(const TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->task_id()); -} - -FunctionID TaskSpec_function(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->function_id()); -} - -ActorID TaskSpec_actor_id(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->actor_id()); -} - -ActorID TaskSpec_actor_handle_id(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->actor_handle_id()); -} - -bool TaskSpec_is_actor_task(TaskSpec *spec) { - return !TaskSpec_actor_id(spec).is_nil(); -} - -ActorID TaskSpec_actor_creation_id(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->actor_creation_id()); -} - -ObjectID TaskSpec_actor_creation_dummy_object_id(TaskSpec *spec) { - RAY_CHECK(spec); - // The task must be an actor method. - RAY_CHECK(TaskSpec_is_actor_task(spec)); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->actor_creation_dummy_object_id()); -} - -bool TaskSpec_is_actor_creation_task(TaskSpec *spec) { - return !TaskSpec_actor_creation_id(spec).is_nil(); -} - -int64_t TaskSpec_actor_counter(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return std::abs(message->actor_counter()); -} - -bool TaskSpec_is_actor_checkpoint_method(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return message->is_actor_checkpoint_method(); -} - -ObjectID TaskSpec_actor_dummy_object(TaskSpec *spec) { - RAY_CHECK(TaskSpec_is_actor_task(spec)); - /* The last return value for actor tasks is the dummy object that - * represents that this task has completed execution. 
*/ - int64_t num_returns = TaskSpec_num_returns(spec); - return TaskSpec_return(spec, num_returns - 1); -} - -UniqueID TaskSpec_driver_id(const TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->driver_id()); -} - -TaskID TaskSpec_parent_task_id(const TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->parent_task_id()); -} - -int64_t TaskSpec_parent_counter(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return message->parent_counter(); -} - -int64_t TaskSpec_num_args(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return message->args()->size(); -} - -int64_t TaskSpec_num_args_by_ref(TaskSpec *spec) { - int64_t num_args = TaskSpec_num_args(spec); - int64_t num_args_by_ref = 0; - for (int64_t i = 0; i < num_args; i++) { - if (TaskSpec_arg_by_ref(spec, i)) { - num_args_by_ref++; - } - } - return num_args_by_ref; -} - -int TaskSpec_arg_id_count(TaskSpec *spec, int64_t arg_index) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - auto ids = message->args()->Get(arg_index)->object_ids(); - if (ids == nullptr) { - return 0; - } else { - return ids->size(); - } -} - -ObjectID TaskSpec_arg_id(TaskSpec *spec, int64_t arg_index, int64_t id_index) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf( - *message->args()->Get(arg_index)->object_ids()->Get(id_index)); -} - -const uint8_t *TaskSpec_arg_val(TaskSpec *spec, int64_t arg_index) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return (uint8_t *) message->args()->Get(arg_index)->data()->c_str(); -} - -int64_t TaskSpec_arg_length(TaskSpec *spec, int64_t arg_index) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return message->args()->Get(arg_index)->data()->size(); -} - -int64_t TaskSpec_num_returns(TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return message->returns()->size(); -} - -bool TaskSpec_arg_by_ref(TaskSpec *spec, int64_t arg_index) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return message->args()->Get(arg_index)->object_ids()->size() != 0; -} - -ObjectID TaskSpec_return(TaskSpec *spec, int64_t return_index) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return from_flatbuf(*message->returns()->Get(return_index)); -} - -double TaskSpec_get_required_resource(const TaskSpec *spec, - const std::string &resource_name) { - // This is a bit ugly. However it shouldn't be much of a performance issue - // because there shouldn't be many distinct resources in a single task spec. 
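// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: every TaskSpec_* accessor
// above re-parses the spec in place with flatbuffers::GetRoot, which is cheap
// because FlatBuffers reads directly out of the serialized buffer. A toy round
// trip showing that build-then-GetRoot pattern, using a string root instead of
// the generated TaskInfo table (whose schema is not part of this hunk).
#include <flatbuffers/flatbuffers.h>

#include <cassert>
#include <cstring>

int round_trip_example() {
  flatbuffers::FlatBufferBuilder fbb;
  fbb.Finish(fbb.CreateString("remote_function_id"));
  // The builder's buffer can be copied into caller-owned memory (the deleted
  // TaskBuilder::Finish memcpy'd it into a malloc'd TaskSpec) and read back
  // later without a separate deserialization step.
  const uint8_t *buf = fbb.GetBufferPointer();
  auto *root = flatbuffers::GetRoot<flatbuffers::String>(buf);
  assert(std::strcmp(root->c_str(), "remote_function_id") == 0);
  return 0;
}
// ---------------------------------------------------------------------------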
- RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - for (size_t i = 0; i < message->required_resources()->size(); i++) { - const ResourcePair *resource_pair = message->required_resources()->Get(i); - if (string_from_flatbuf(*resource_pair->key()) == resource_name) { - return resource_pair->value(); - } - } - return 0; -} - -const std::unordered_map TaskSpec_get_required_resources( - const TaskSpec *spec) { - RAY_CHECK(spec); - auto message = flatbuffers::GetRoot(spec); - return map_from_flatbuf(*message->required_resources()); -} - -TaskSpec *TaskSpec_copy(TaskSpec *spec, int64_t task_spec_size) { - TaskSpec *copy = (TaskSpec *) malloc(task_spec_size); - memcpy(copy, spec, task_spec_size); - return copy; -} - -void TaskSpec_free(TaskSpec *spec) { - free(spec); -} - -TaskExecutionSpec::TaskExecutionSpec( - const std::vector &execution_dependencies, - const TaskSpec *spec, - int64_t task_spec_size, - int spillback_count) - : execution_dependencies_(execution_dependencies), - task_spec_size_(task_spec_size), - last_timestamp_(0), - spillback_count_(spillback_count) { - TaskSpec *spec_copy = new TaskSpec[task_spec_size_]; - memcpy(spec_copy, spec, task_spec_size); - spec_ = std::unique_ptr(spec_copy); -} - -TaskExecutionSpec::TaskExecutionSpec( - const std::vector &execution_dependencies, - const TaskSpec *spec, - int64_t task_spec_size) - : TaskExecutionSpec(execution_dependencies, spec, task_spec_size, 0) {} - -TaskExecutionSpec::TaskExecutionSpec(TaskExecutionSpec *other) - : execution_dependencies_(other->execution_dependencies_), - task_spec_size_(other->task_spec_size_), - last_timestamp_(other->last_timestamp_), - spillback_count_(other->spillback_count_) { - TaskSpec *spec_copy = new TaskSpec[task_spec_size_]; - memcpy(spec_copy, other->spec_.get(), task_spec_size_); - spec_ = std::unique_ptr(spec_copy); -} - -const std::vector &TaskExecutionSpec::ExecutionDependencies() const { - return execution_dependencies_; -} - -void TaskExecutionSpec::SetExecutionDependencies( - const std::vector &dependencies) { - execution_dependencies_ = dependencies; -} - -int64_t TaskExecutionSpec::SpecSize() const { - return task_spec_size_; -} - -int TaskExecutionSpec::SpillbackCount() const { - return spillback_count_; -} - -void TaskExecutionSpec::IncrementSpillbackCount() { - ++spillback_count_; -} - -int64_t TaskExecutionSpec::LastTimeStamp() const { - return last_timestamp_; -} - -void TaskExecutionSpec::SetLastTimeStamp(int64_t new_timestamp) { - last_timestamp_ = new_timestamp; -} - -TaskSpec *TaskExecutionSpec::Spec() const { - return spec_.get(); -} - -int64_t TaskExecutionSpec::NumDependencies() const { - TaskSpec *spec = Spec(); - int64_t num_dependencies = TaskSpec_num_args(spec); - num_dependencies += execution_dependencies_.size(); - return num_dependencies; -} - -int TaskExecutionSpec::DependencyIdCount(int64_t dependency_index) const { - TaskSpec *spec = Spec(); - /* The first dependencies are the arguments of the task itself, followed by - * the execution dependencies. Find the total number of task arguments so - * that we can index into the correct list. */ - int64_t num_args = TaskSpec_num_args(spec); - if (dependency_index < num_args) { - /* Index into the task arguments. */ - return TaskSpec_arg_id_count(spec, dependency_index); - } else { - /* Index into the execution dependencies. */ - dependency_index -= num_args; - RAY_CHECK((size_t) dependency_index < execution_dependencies_.size()); - /* All elements in the execution dependency list have exactly one ID. 
*/ - return 1; - } -} - -ObjectID TaskExecutionSpec::DependencyId(int64_t dependency_index, - int64_t id_index) const { - TaskSpec *spec = Spec(); - /* The first dependencies are the arguments of the task itself, followed by - * the execution dependencies. Find the total number of task arguments so - * that we can index into the correct list. */ - int64_t num_args = TaskSpec_num_args(spec); - if (dependency_index < num_args) { - /* Index into the task arguments. */ - return TaskSpec_arg_id(spec, dependency_index, id_index); - } else { - /* Index into the execution dependencies. */ - dependency_index -= num_args; - RAY_CHECK((size_t) dependency_index < execution_dependencies_.size()); - return execution_dependencies_[dependency_index]; - } -} - -bool TaskExecutionSpec::DependsOn(ObjectID object_id) const { - // Iterate through the task arguments to see if it contains object_id. - TaskSpec *spec = Spec(); - int64_t num_args = TaskSpec_num_args(spec); - for (int i = 0; i < num_args; ++i) { - int count = TaskSpec_arg_id_count(spec, i); - for (int j = 0; j < count; j++) { - ObjectID arg_id = TaskSpec_arg_id(spec, i, j); - if (arg_id == object_id) { - return true; - } - } - } - // Iterate through the execution dependencies to see if it contains object_id. - for (auto dependency_id : execution_dependencies_) { - if (dependency_id == object_id) { - return true; - } - } - // The requested object ID was not a task argument or an execution dependency. - // This task is not dependent on it. - return false; -} - -bool TaskExecutionSpec::IsStaticDependency(int64_t dependency_index) const { - TaskSpec *spec = Spec(); - /* The first dependencies are the arguments of the task itself, followed by - * the execution dependencies. If the requested dependency index is a task - * argument, then it is a task dependency. 
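// ---------------------------------------------------------------------------
// Illustrative sketch, not the deleted implementation: DependencyIdCount and
// DependencyId above treat a task's dependencies as the immutable task
// arguments followed by the mutable execution dependencies, translating a flat
// index into one of the two lists. The same indexing in isolation, with strings
// standing in for object IDs; DepsSketch is a placeholder type.
#include <cassert>
#include <cstdint>
#include <string>
#include <vector>

struct DepsSketch {
  std::vector<std::vector<std::string>> arg_ids;  // object IDs per task argument
  std::vector<std::string> execution_deps;        // exactly one ID per entry

  int64_t NumDependencies() const {
    return static_cast<int64_t>(arg_ids.size() + execution_deps.size());
  }

  const std::string &DependencyId(int64_t dep_index, int64_t id_index) const {
    const int64_t num_args = static_cast<int64_t>(arg_ids.size());
    if (dep_index < num_args) {
      return arg_ids[dep_index][id_index];  // a static task argument
    }
    assert(id_index == 0);  // execution dependencies hold a single ID each
    return execution_deps[dep_index - num_args];
  }
};
// ---------------------------------------------------------------------------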
*/ - int64_t num_args = TaskSpec_num_args(spec); - return (dependency_index < num_args); -} - -/* TASK INSTANCES */ - -Task *Task_alloc(const TaskSpec *spec, - int64_t task_spec_size, - TaskStatus state, - DBClientID local_scheduler_id, - const std::vector &execution_dependencies) { - Task *result = new Task(); - auto execution_spec = - new TaskExecutionSpec(execution_dependencies, spec, task_spec_size); - result->execution_spec = std::unique_ptr(execution_spec); - result->state = state; - result->local_scheduler_id = local_scheduler_id; - return result; -} - -Task *Task_alloc(TaskExecutionSpec &execution_spec, - TaskStatus state, - DBClientID local_scheduler_id) { - Task *result = new Task(); - result->execution_spec = std::unique_ptr( - new TaskExecutionSpec(&execution_spec)); - result->state = state; - result->local_scheduler_id = local_scheduler_id; - return result; -} - -Task *Task_copy(Task *other) { - return Task_alloc(*Task_task_execution_spec(other), other->state, - other->local_scheduler_id); -} - -int64_t Task_size(Task *task_arg) { - return sizeof(Task) - sizeof(TaskSpec) + task_arg->execution_spec->SpecSize(); -} - -TaskStatus Task_state(Task *task) { - return task->state; -} - -void Task_set_state(Task *task, TaskStatus state) { - task->state = state; -} - -DBClientID Task_local_scheduler(Task *task) { - return task->local_scheduler_id; -} - -void Task_set_local_scheduler(Task *task, DBClientID local_scheduler_id) { - task->local_scheduler_id = local_scheduler_id; -} - -TaskExecutionSpec *Task_task_execution_spec(Task *task) { - return task->execution_spec.get(); -} - -TaskID Task_task_id(Task *task) { - TaskExecutionSpec *execution_spec = Task_task_execution_spec(task); - TaskSpec *spec = execution_spec->Spec(); - return TaskSpec_task_id(spec); -} - -void Task_free(Task *task) { - delete task; -} diff --git a/src/common/task.h b/src/common/task.h deleted file mode 100644 index 3984cfdd51195..0000000000000 --- a/src/common/task.h +++ /dev/null @@ -1,609 +0,0 @@ -#ifndef TASK_H -#define TASK_H - -#include - -#include -#include -#include "common.h" - -#include - -#include "format/common_generated.h" - -using namespace ray; - -typedef char TaskSpec; - -class TaskExecutionSpec { - public: - TaskExecutionSpec(const std::vector &execution_dependencies, - const TaskSpec *spec, - int64_t task_spec_size); - TaskExecutionSpec(const std::vector &execution_dependencies, - const TaskSpec *spec, - int64_t task_spec_size, - int spillback_count); - TaskExecutionSpec(TaskExecutionSpec *execution_spec); - - /// Get the task's execution dependencies. - /// - /// @return A vector of object IDs representing this task's execution - /// dependencies. - const std::vector &ExecutionDependencies() const; - - /// Set the task's execution dependencies. - /// - /// @param dependencies The value to set the execution dependencies to. - /// @return Void. - void SetExecutionDependencies(const std::vector &dependencies); - - /// Get the task spec size. - /// - /// @return The size of the immutable task spec. - int64_t SpecSize() const; - - /// Get the task's spillback count, which tracks the number of times - /// this task was spilled back from local to the global scheduler. - /// - /// @return The spillback count for this task. - int SpillbackCount() const; - - /// Increment the spillback count for this task. - /// - /// @return Void. - void IncrementSpillbackCount(); - - /// Get the task's last timestamp. - /// - /// @return The timestamp when this task was last received for scheduling. 
- int64_t LastTimeStamp() const; - - /// Set the task's last timestamp to the specified value. - /// - /// @param new_timestamp The new timestamp in millisecond to set the task's - /// time stamp to. Tracks the last time this task entered a local - /// scheduler. - /// @return Void. - void SetLastTimeStamp(int64_t new_timestamp); - - /// Get the task spec. - /// - /// @return A pointer to the immutable task spec. - TaskSpec *Spec() const; - - /// Get the number of dependencies. This comprises the immutable task - /// arguments and the mutable execution dependencies. - /// - /// @return The number of dependencies. - int64_t NumDependencies() const; - - /// Get the number of object IDs at the given dependency index. - /// - /// @param dependency_index The dependency index whose object IDs to count. - /// @return The number of object IDs at the given dependency_index. - int DependencyIdCount(int64_t dependency_index) const; - - /// Get the object ID of a given dependency index. - /// - /// @param dependency_index The index at which we should look up the object - /// ID. - /// @param id_index The index of the object ID. - ObjectID DependencyId(int64_t dependency_index, int64_t id_index) const; - - /// Compute whether the task is dependent on an object ID. - /// - /// @param object_id The object ID that the task may be dependent on. - /// @return bool This returns true if the task is dependent on the given - /// object ID and false otherwise. - bool DependsOn(ObjectID object_id) const; - - /// Returns whether the given dependency index is a static dependency (an - /// argument of the immutable task). - /// - /// @param dependency_index The requested dependency index. - /// @return bool This returns true if the requested dependency index is - /// immutable (an argument of the task). - bool IsStaticDependency(int64_t dependency_index) const; - - private: - /** A list of object IDs representing this task's dependencies at execution - * time. */ - std::vector execution_dependencies_; - /** The size of the task specification for this task. */ - int64_t task_spec_size_; - /** Last time this task was received for scheduling. */ - int64_t last_timestamp_; - /** Number of times this task was spilled back by local schedulers. */ - int spillback_count_; - /** The task specification for this task. */ - std::unique_ptr spec_; -}; - -class TaskBuilder; - -typedef UniqueID FunctionID; - -/** The task ID is a deterministic hash of the function ID that the task - * executes and the argument IDs or argument values. */ -typedef UniqueID TaskID; - -/** The actor ID is the ID of the actor that a task must run on. If the task is - * not run on an actor, then NIL_ACTOR_ID should be used. */ -typedef UniqueID ActorID; - -/** - * Compare two task IDs. - * - * @param first_id The first task ID to compare. - * @param second_id The first task ID to compare. - * @return True if the task IDs are the same and false otherwise. - */ -bool TaskID_equal(TaskID first_id, TaskID second_id); - -/** - * Compare a task ID to the nil ID. - * - * @param id The task ID to compare to nil. - * @return True if the task ID is equal to nil. - */ -bool TaskID_is_nil(TaskID id); - -/** - * Compare two actor IDs. - * - * @param first_id The first actor ID to compare. - * @param second_id The first actor ID to compare. - * @return True if the actor IDs are the same and false otherwise. - */ -bool ActorID_equal(ActorID first_id, ActorID second_id); - -/** - * Compare two function IDs. - * - * @param first_id The first function ID to compare. 
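/* Illustrative sketch, not part of the deleted header: how the dependency
 * indexing of TaskExecutionSpec is typically consumed. Indices in
 * [0, num_args) address the immutable task arguments (static dependencies);
 * the remaining indices address the mutable execution dependencies. The two
 * helpers below are hypothetical and only use the accessors declared above. */
#include <vector>
#include "task.h"

std::vector<ObjectID> CollectDependencyIds(const TaskExecutionSpec &exec_spec) {
  std::vector<ObjectID> ids;
  for (int64_t i = 0; i < exec_spec.NumDependencies(); ++i) {
    /* A single dependency index can hold several object IDs. */
    for (int j = 0; j < exec_spec.DependencyIdCount(i); ++j) {
      ids.push_back(exec_spec.DependencyId(i, j));
    }
  }
  return ids;
}

void AppendExecutionDependency(TaskExecutionSpec &exec_spec, ObjectID new_dep) {
  /* The task spec itself is immutable, but the execution dependencies can be
   * replaced wholesale. Afterwards DependsOn() reports the new object and
   * IsStaticDependency() still distinguishes it from the task arguments. */
  std::vector<ObjectID> deps = exec_spec.ExecutionDependencies();
  deps.push_back(new_dep);
  exec_spec.SetExecutionDependencies(deps);
}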
- * @param second_id The first function ID to compare. - * @return True if the function IDs are the same and false otherwise. - */ -bool FunctionID_equal(FunctionID first_id, FunctionID second_id); - -/** - * Compare a function ID to the nil ID. - * - * @param id The function ID to compare to nil. - * @return True if the function ID is equal to nil. - */ -bool FunctionID_is_nil(FunctionID id); - -/* Construct and modify task specifications. */ - -TaskBuilder *make_task_builder(void); - -void free_task_builder(TaskBuilder *builder); - -/** - * Begin constructing a task_spec. After this is called, the arguments must be - * added to the task_spec and then finish_construct_task_spec must be called. - * - * @param driver_id The ID of the driver whose job is responsible for the - * creation of this task. - * @param parent_task_id The task ID of the task that submitted this task. - * @param parent_counter A counter indicating how many tasks were submitted by - * the parent task prior to this one. - * @param actor_creation_id The actor creation ID of this task. - * @param actor_creation_dummy_object_id The dummy object for the corresponding - * actor creation task, assuming this is an actor method. - * @param actor_id The ID of the actor that this task is for. If it is not an - * actor task, then this if NIL_ACTOR_ID. - * @param actor_handle_id The ID of the actor handle that this task was - * submitted through. If it is not an actor task, or if this is the - * original handle, then this is NIL_ACTOR_ID. - * @param actor_counter A counter indicating how many tasks have been submitted - * to the same actor before this one. - * @param is_actor_checkpoint_method True if this is an actor checkpoint method - * and false otherwise. - * @param function_id The function ID of the function to execute in this task. - * @param num_args The number of arguments that this task has. - * @param num_returns The number of return values that this task has. - * @param args_value_size The total size in bytes of the arguments to this task - ignoring object ID arguments. - * @return The partially constructed task_spec. - */ -void TaskSpec_start_construct(TaskBuilder *B, - UniqueID driver_id, - TaskID parent_task_id, - int64_t parent_counter, - ActorID actor_creation_id, - ObjectID actor_creation_dummy_object_id, - ActorID actor_id, - ActorHandleID actor_handle_id, - int64_t actor_counter, - bool is_actor_checkpoint_method, - FunctionID function_id, - int64_t num_returns); - -/** - * Finish constructing a task_spec. This computes the task ID and the object IDs - * of the task return values. This must be called after all of the arguments - * have been added to the task. - * - * @param spec The task spec whose ID and return object IDs should be computed. - * @return Void. - */ -TaskSpec *TaskSpec_finish_construct(TaskBuilder *builder, int64_t *size); - -/** - * Return the function ID of the task. - * - * @param spec The task_spec in question. - * @return The function ID of the function to execute in this task. - */ -FunctionID TaskSpec_function(TaskSpec *spec); - -/** - * Return the actor ID of the task. - * - * @param spec The task_spec in question. - * @return The actor ID of the actor the task is part of. - */ -ActorID TaskSpec_actor_id(TaskSpec *spec); - -/** - * Return the actor handle ID of the task. - * - * @param spec The task_spec in question. - * @return The ID of the actor handle that the task was submitted through. 
- */ -ActorID TaskSpec_actor_handle_id(TaskSpec *spec); - -/** - * Return whether this task is for an actor. - * - * @param spec The task_spec in question. - * @return Whether the task is for an actor. - */ -bool TaskSpec_is_actor_task(TaskSpec *spec); - -/// Return whether this task is an actor creation task or not. -/// -/// \param spec The task_spec in question. -/// \return True if this task is an actor creation task and false otherwise. -bool TaskSpec_is_actor_creation_task(TaskSpec *spec); - -/// Return the actor creation ID of the task. The task must be an actor creation -/// task. -/// -/// \param spec The task_spec in question. -/// \return The actor creation ID if this is an actor creation task. -ActorID TaskSpec_actor_creation_id(TaskSpec *spec); - -/// Return the actor creation dummy object ID of the task. The task must be an -/// actor task. -/// -/// \param spec The task_spec in question. -/// \return The actor creation dummy object ID corresponding to this actor task. -ObjectID TaskSpec_actor_creation_dummy_object_id(TaskSpec *spec); - -/** - * Return the actor counter of the task. This starts at 0 and increments by 1 - * every time a new task is submitted to run on the actor. - * - * @param spec The task_spec in question. - * @return The actor counter of the task. - */ -int64_t TaskSpec_actor_counter(TaskSpec *spec); - -/** - * Return whether the task is a checkpoint method execution. - * - * @param spec The task_spec in question. - * @return Whether the task is a checkpoint method. - */ -bool TaskSpec_is_actor_checkpoint_method(TaskSpec *spec); - -/** - * Return an actor task's dummy return value. Dummy objects are used to - * encode an actor's state dependencies in the task graph. The dummy object - * is local if and only if the task that returned it has completed - * execution. - * - * @param spec The task_spec in question. - * @return The dummy object ID that the actor task will return. - */ -ObjectID TaskSpec_actor_dummy_object(TaskSpec *spec); - -/** - * Return the driver ID of the task. - * - * @param spec The task_spec in question. - * @return The driver ID of the task. - */ -UniqueID TaskSpec_driver_id(const TaskSpec *spec); - -/** - * Return the task ID of the parent task. - * - * @param spec The task_spec in question. - * @return The task ID of the parent task. - */ -TaskID TaskSpec_parent_task_id(const TaskSpec *spec); - -/** - * Return the task counter of the parent task. For example, this equals 5 if - * this task was the 6th task submitted by the parent task. - * - * @param spec The task_spec in question. - * @return The task counter of the parent task. - */ -int64_t TaskSpec_parent_counter(TaskSpec *spec); - -/** - * Return the task ID of the task. - * - * @param spec The task_spec in question. - * @return The task ID of the task. - */ -TaskID TaskSpec_task_id(const TaskSpec *spec); - -/** - * Get the number of arguments to this task. - * - * @param spec The task_spec in question. - * @return The number of arguments to this task. - */ -int64_t TaskSpec_num_args(TaskSpec *spec); - -/** - * Get the number of return values expected from this task. - * - * @param spec The task_spec in question. - * @return The number of return values expected from this task. - */ -int64_t TaskSpec_num_returns(TaskSpec *spec); - -/** - * Return true if this argument is passed by reference. - * - * @param spec The task_spec in question. - * @param arg_index The index of the argument in question. - * @return True if this argument is passed by reference. 
- */ -bool TaskSpec_arg_by_ref(TaskSpec *spec, int64_t arg_index); - -/** - * Get number of object IDs in a given argument - * - * @param spec The task_spec in question. - * @param arg_index The index of the argument in question. - * @return number of object IDs in this argument - */ -int TaskSpec_arg_id_count(TaskSpec *spec, int64_t arg_index); - -/** - * Get a particular argument to this task. This assumes the argument is an - * object ID. - * - * @param spec The task_spec in question. - * @param arg_index The index of the argument in question. - * @param id_index The index of the object ID in this arg. - * @return The argument at that index. - */ -ObjectID TaskSpec_arg_id(TaskSpec *spec, int64_t arg_index, int64_t id_index); - -/** - * Get a particular argument to this task. This assumes the argument is a value. - * - * @param spec The task_spec in question. - * @param arg_index The index of the argument in question. - * @return The argument at that index. - */ -const uint8_t *TaskSpec_arg_val(TaskSpec *spec, int64_t arg_index); - -/** - * Get the number of bytes in a particular argument to this task. This assumes - * the argument is a value. - * - * @param spec The task_spec in question. - * @param arg_index The index of the argument in question. - * @return The number of bytes in the argument. - */ -int64_t TaskSpec_arg_length(TaskSpec *spec, int64_t arg_index); - -/** - * Set the next task argument. Note that this API only allows you to set the - * arguments in their order of appearance. - * - * @param spec The task_spec in question. - * @param object_ids The object IDs to set the argument to. - * @param num_object_ids number of IDs in this param, usually 1. - * @return The number of task arguments that have been set before this one. This - * is only used for testing. - */ -void TaskSpec_args_add_ref(TaskBuilder *spec, - ObjectID object_ids[], - int num_object_ids); - -/** - * Set the next task argument. Note that this API only allows you to set the - * arguments in their order of appearance. - * - * @param spec The task_spec in question. - * @param The value to set the argument to. - * @param The length of the value to set the argument to. - * @return The number of task arguments that have been set before this one. This - * is only used for testing. - */ -void TaskSpec_args_add_val(TaskBuilder *builder, - uint8_t *value, - int64_t length); - -/** - * Set the value associated to a resource index. - * - * @param spec Task specification. - * @param resource_name Name of the resource in the resource vector. - * @param value Value for the resource. This can be a quantity of this resource - * this task needs or a value for an attribute this task requires. - * @return Void. - */ -void TaskSpec_set_required_resource(TaskBuilder *builder, - const std::string &resource_name, - double value); - -/** - * Get a particular return object ID of a task. - * - * @param spec The task_spec in question. - * @param return_index The index of the return object ID in question. - * @return The relevant return object ID. - */ -ObjectID TaskSpec_return(TaskSpec *data, int64_t return_index); - -/** - * Get the value associated to a resource name. - * - * @param spec Task specification. - * @param resource_name Name of the resource. - * @return How many of this resource the task needs to execute. 
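/* Illustrative sketch of the builder workflow documented above. The function
 * name and the concrete argument values are hypothetical; the call pattern
 * mirrors the example_task.h test helper that appears later in this diff.
 * A non-actor task passes nil IDs and zero counters for the actor fields. */
#include <cstdint>
#include <cstring>
#include "task.h"

TaskSpec *BuildExampleSpec(TaskBuilder *builder, int64_t *spec_size) {
  TaskID parent_task_id = TaskID::from_random();
  FunctionID function_id = FunctionID::from_random();
  TaskSpec_start_construct(builder, UniqueID::nil(), parent_task_id,
                           /* parent_counter */ 0, ActorID::nil(),
                           ObjectID::nil(), ActorID::nil(), ActorID::nil(),
                           /* actor_counter */ 0,
                           /* is_actor_checkpoint_method */ false, function_id,
                           /* num_returns */ 1);
  /* Arguments must be added in their order of appearance: here one
   * pass-by-reference object ID followed by one small pass-by-value payload. */
  ObjectID arg_id = ObjectID::from_random();
  TaskSpec_args_add_ref(builder, &arg_id, 1);
  const char *payload = "hello";
  TaskSpec_args_add_val(builder, (uint8_t *) payload, strlen(payload));
  TaskSpec_set_required_resource(builder, "CPU", 1.0);
  /* Finishing the construction computes the task ID and the return object
   * IDs; the caller owns the result and releases it with TaskSpec_free. */
  return TaskSpec_finish_construct(builder, spec_size);
}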
- */ -double TaskSpec_get_required_resource(const TaskSpec *spec, - const std::string &resource_name); - -/** - * - */ -const std::unordered_map TaskSpec_get_required_resources( - const TaskSpec *spec); - -/** - * Compute the object id associated to a put call. - * - * @param task_id The task id of the parent task that called the put. - * @param put_index The number of put calls in this task so far. - * @return The object ID for the object that was put. - */ -ObjectID task_compute_put_id(TaskID task_id, int64_t put_index); - -/** - * Print the task as a humanly readable string. - * - * @param spec The task_spec in question. - * @return The humanly readable string. - */ -std::string TaskSpec_print(TaskSpec *spec); - -/** - * Create a copy of the task spec. Must be freed with TaskSpec_free after use. - * - * @param spec The task specification that will be copied. - * @param task_spec_size The size of the task specification in bytes. - * @returns Pointer to the copy of the task specification. - */ -TaskSpec *TaskSpec_copy(TaskSpec *spec, int64_t task_spec_size); - -/** - * Free a task_spec. - * - * @param The task_spec in question. - * @return Void. - */ -void TaskSpec_free(TaskSpec *spec); - -/** - * ==== Task ==== - * Contains information about a scheduled task: The task specification, the - * task scheduling state (WAITING, SCHEDULED, QUEUED, RUNNING, DONE), and which - * local scheduler the task is scheduled on. - */ - -/** The scheduling_state can be used as a flag when we are listening - * for an event, for example TASK_WAITING | TASK_SCHEDULED. */ -enum class TaskStatus : uint { - /** The task is waiting to be scheduled. */ - WAITING = 1, - /** The task has been scheduled to a node, but has not been queued yet. */ - SCHEDULED = 2, - /** The task has been queued on a node, where it will wait for its - * dependencies to become ready and a worker to become available. */ - QUEUED = 4, - /** The task is running on a worker. */ - RUNNING = 8, - /** The task is done executing. */ - DONE = 16, - /** The task was not able to finish. */ - LOST = 32, - /** The task will be submitted for reexecution. */ - RECONSTRUCTING = 64, - /** An actor task is cached at a local scheduler and is waiting for the - * corresponding actor to be created. */ - ACTOR_CACHED = 128 -}; - -inline TaskStatus operator|(const TaskStatus &a, const TaskStatus &b) { - uint c = static_cast(a) | static_cast(b); - return static_cast(c); -} - -/** A task is an execution of a task specification. It has a state of execution - * (see scheduling_state) and the ID of the local scheduler it is scheduled on - * or running on. */ - -struct Task { - /** The scheduling state of the task. */ - TaskStatus state; - /** The ID of the local scheduler involved. */ - DBClientID local_scheduler_id; - /** The execution specification for this task. */ - std::unique_ptr execution_spec; -}; - -/** - * Allocate a new task. Must be freed with free_task after use. - * - * @param spec The task spec for the new task. - * @param state The scheduling state for the new task. - * @param local_scheduler_id The ID of the local scheduler that the task is - * scheduled on, if any. - */ -Task *Task_alloc(const TaskSpec *spec, - int64_t task_spec_size, - TaskStatus state, - DBClientID local_scheduler_id, - const std::vector &execution_dependencies); - -Task *Task_alloc(TaskExecutionSpec &execution_spec, - TaskStatus state, - DBClientID local_scheduler_id); - -/** - * Create a copy of the task. Must be freed with Task_free after use. 
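/* Illustrative sketch of how the TaskStatus flags combine into a subscription
 * mask. Only operator| is defined in the deleted header, so the membership
 * test below casts back to the underlying integer type; StatusMatches and
 * ExampleStatusUsage are hypothetical helpers built only on the declarations
 * shown in this file. */
#include "task.h"

bool StatusMatches(TaskStatus mask, TaskStatus state) {
  /* True if `state` is one of the states OR-ed into `mask`. */
  return (static_cast<uint>(mask) & static_cast<uint>(state)) != 0;
}

void ExampleStatusUsage(TaskExecutionSpec &execution_spec) {
  /* A subscriber interested in tasks that are waiting or already scheduled
   * would pass a combined mask, e.g. to task_table_subscribe. */
  TaskStatus mask = TaskStatus::WAITING | TaskStatus::SCHEDULED;
  Task *task = Task_alloc(execution_spec, TaskStatus::WAITING, UniqueID::nil());
  RAY_CHECK(StatusMatches(mask, Task_state(task)));
  Task_set_state(task, TaskStatus::RUNNING);
  RAY_CHECK(!StatusMatches(mask, Task_state(task)));
  Task_free(task);
}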
- * - * @param other The task that will be copied. - * @returns Pointer to the copy of the task. - */ -Task *Task_copy(Task *other); - -/** Size of task structure in bytes. */ -int64_t Task_size(Task *task); - -/** The scheduling state of the task. */ -TaskStatus Task_state(Task *task); - -/** Update the schedule state of the task. */ -void Task_set_state(Task *task, TaskStatus state); - -/** Local scheduler this task has been assigned to or is running on. */ -DBClientID Task_local_scheduler(Task *task); - -/** Set the local scheduler ID for this task. */ -void Task_set_local_scheduler(Task *task, DBClientID local_scheduler_id); - -TaskExecutionSpec *Task_task_execution_spec(Task *task); - -/** Task ID of this task. */ -TaskID Task_task_id(Task *task); - -/** Free this task datastructure. */ -void Task_free(Task *task); - -#endif /* TASK_H */ diff --git a/src/common/test/db_tests.cc b/src/common/test/db_tests.cc deleted file mode 100644 index 83585ca66e0f9..0000000000000 --- a/src/common/test/db_tests.cc +++ /dev/null @@ -1,246 +0,0 @@ -#include "greatest.h" - -#include -#include -#include - -#include "event_loop.h" -#include "test_common.h" -#include "example_task.h" -#include "net.h" -#include "state/db.h" -#include "state/db_client_table.h" -#include "state/object_table.h" -#include "state/task_table.h" -#include "state/redis.h" -#include "task.h" - -SUITE(db_tests); - -TaskBuilder *g_task_builder = NULL; - -/* Retry 10 times with an 100ms timeout. */ -const int NUM_RETRIES = 10; -const uint64_t TIMEOUT = 50; - -const char *manager_addr = "127.0.0.1"; -int manager_port1 = 12345; -int manager_port2 = 12346; -char received_addr1[16] = {0}; -int received_port1; -char received_addr2[16] = {0}; -int received_port2; - -typedef struct { int test_number; } user_context; - -const int TEST_NUMBER = 10; - -/* Test if entries have been written to the database. */ - -void lookup_done_callback(ObjectID object_id, - bool never_created, - const std::vector &manager_ids, - void *user_context) { - DBHandle *db = (DBHandle *) user_context; - RAY_CHECK(manager_ids.size() == 2); - const std::vector managers = - db_client_table_get_ip_addresses(db, manager_ids); - RAY_CHECK(parse_ip_addr_port(managers.at(0).c_str(), received_addr1, - &received_port1) == 0); - RAY_CHECK(parse_ip_addr_port(managers.at(1).c_str(), received_addr2, - &received_port2) == 0); -} - -/* Entry added to database successfully. */ -void add_done_callback(ObjectID object_id, bool success, void *user_context) {} - -/* Test if we got a timeout callback if we couldn't connect database. */ -void timeout_callback(ObjectID object_id, void *context, void *user_data) { - user_context *uc = (user_context *) context; - RAY_CHECK(uc->test_number == TEST_NUMBER); -} - -int64_t timeout_handler(event_loop *loop, int64_t id, void *context) { - event_loop_stop(loop); - return EVENT_LOOP_TIMER_DONE; -} - -TEST object_table_lookup_test(void) { - event_loop *loop = event_loop_create(); - /* This uses manager_port1. */ - std::vector db_connect_args1; - db_connect_args1.push_back("manager_address"); - db_connect_args1.push_back("127.0.0.1:12345"); - DBHandle *db1 = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - manager_addr, db_connect_args1); - /* This uses manager_port2. 
*/ - std::vector db_connect_args2; - db_connect_args2.push_back("manager_address"); - db_connect_args2.push_back("127.0.0.1:12346"); - DBHandle *db2 = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - manager_addr, db_connect_args2); - db_attach(db1, loop, false); - db_attach(db2, loop, false); - UniqueID id = UniqueID::from_random(); - RetryInfo retry = { - .num_retries = NUM_RETRIES, - .timeout = TIMEOUT, - .fail_callback = timeout_callback, - }; - object_table_add(db1, id, 0, (unsigned char *) NIL_DIGEST, &retry, - add_done_callback, NULL); - object_table_add(db2, id, 0, (unsigned char *) NIL_DIGEST, &retry, - add_done_callback, NULL); - event_loop_add_timer(loop, 200, (event_loop_timer_handler) timeout_handler, - NULL); - event_loop_run(loop); - object_table_lookup(db1, id, &retry, lookup_done_callback, db1); - event_loop_add_timer(loop, 200, (event_loop_timer_handler) timeout_handler, - NULL); - event_loop_run(loop); - ASSERT_STR_EQ(&received_addr1[0], manager_addr); - ASSERT((received_port1 == manager_port1 && received_port2 == manager_port2) || - (received_port2 == manager_port1 && received_port1 == manager_port2)); - - db_disconnect(db1); - db_disconnect(db2); - - destroy_outstanding_callbacks(loop); - event_loop_destroy(loop); - PASS(); -} - -int task_table_test_callback_called = 0; -Task *task_table_test_task; - -void task_table_test_fail_callback(UniqueID id, - void *context, - void *user_data) { - event_loop *loop = (event_loop *) user_data; - event_loop_stop(loop); -} - -int64_t task_table_delayed_add_task(event_loop *loop, - int64_t id, - void *context) { - DBHandle *db = (DBHandle *) context; - RetryInfo retry = { - .num_retries = NUM_RETRIES, - .timeout = TIMEOUT, - .fail_callback = task_table_test_fail_callback, - }; - task_table_add_task(db, Task_copy(task_table_test_task), &retry, NULL, - (void *) loop); - return EVENT_LOOP_TIMER_DONE; -} - -void task_table_test_callback(Task *callback_task, void *user_data) { - task_table_test_callback_called = 1; - RAY_CHECK(Task_state(callback_task) == TaskStatus::SCHEDULED); - RAY_CHECK(Task_size(callback_task) == Task_size(task_table_test_task)); - RAY_CHECK(Task_equals(callback_task, task_table_test_task)); - event_loop *loop = (event_loop *) user_data; - event_loop_stop(loop); -} - -TEST task_table_test(void) { - task_table_test_callback_called = 0; - event_loop *loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "local_scheduler", - "127.0.0.1", std::vector()); - db_attach(db, loop, false); - DBClientID local_scheduler_id = DBClientID::from_random(); - TaskExecutionSpec spec = example_task_execution_spec(1, 1); - task_table_test_task = - Task_alloc(spec, TaskStatus::SCHEDULED, local_scheduler_id); - RetryInfo retry = { - .num_retries = NUM_RETRIES, - .timeout = TIMEOUT, - .fail_callback = task_table_test_fail_callback, - }; - task_table_subscribe(db, local_scheduler_id, TaskStatus::SCHEDULED, - task_table_test_callback, (void *) loop, &retry, NULL, - (void *) loop); - event_loop_add_timer( - loop, 200, (event_loop_timer_handler) task_table_delayed_add_task, db); - event_loop_run(loop); - Task_free(task_table_test_task); - db_disconnect(db); - destroy_outstanding_callbacks(loop); - event_loop_destroy(loop); - ASSERT(task_table_test_callback_called); - PASS(); -} - -int num_test_callback_called = 0; - -void task_table_all_test_callback(Task *task, void *user_data) { - num_test_callback_called += 1; -} - -TEST task_table_all_test(void) { - event_loop *loop = event_loop_create(); - 
DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "local_scheduler", - "127.0.0.1", std::vector()); - db_attach(db, loop, false); - TaskExecutionSpec spec = example_task_execution_spec(1, 1); - /* Schedule two tasks on different local local schedulers. */ - Task *task1 = - Task_alloc(spec, TaskStatus::SCHEDULED, DBClientID::from_random()); - Task *task2 = - Task_alloc(spec, TaskStatus::SCHEDULED, DBClientID::from_random()); - RetryInfo retry = { - .num_retries = NUM_RETRIES, .timeout = TIMEOUT, .fail_callback = NULL, - }; - task_table_subscribe(db, UniqueID::nil(), TaskStatus::SCHEDULED, - task_table_all_test_callback, NULL, &retry, NULL, NULL); - event_loop_add_timer(loop, 50, (event_loop_timer_handler) timeout_handler, - NULL); - event_loop_run(loop); - /* TODO(pcm): Get rid of this sleep once the robust pubsub is implemented. */ - task_table_add_task(db, task1, &retry, NULL, NULL); - task_table_add_task(db, task2, &retry, NULL, NULL); - event_loop_add_timer(loop, 200, (event_loop_timer_handler) timeout_handler, - NULL); - event_loop_run(loop); - db_disconnect(db); - destroy_outstanding_callbacks(loop); - event_loop_destroy(loop); - ASSERT(num_test_callback_called == 2); - PASS(); -} - -TEST unique_client_id_test(void) { - const int num_conns = 100; - - DBClientID ids[num_conns]; - DBHandle *db; - for (int i = 0; i < num_conns; ++i) { - db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - ids[i] = get_db_client_id(db); - db_disconnect(db); - } - for (int i = 0; i < num_conns; ++i) { - for (int j = 0; j < i; ++j) { - ASSERT(!(ids[i] == ids[j])); - } - } - PASS(); -} - -SUITE(db_tests) { - RUN_REDIS_TEST(object_table_lookup_test); - RUN_REDIS_TEST(task_table_test); - RUN_REDIS_TEST(task_table_all_test); - RUN_REDIS_TEST(unique_client_id_test); -} - -GREATEST_MAIN_DEFS(); - -int main(int argc, char **argv) { - g_task_builder = make_task_builder(); - GREATEST_MAIN_BEGIN(); - RUN_SUITE(db_tests); - GREATEST_MAIN_END(); -} diff --git a/src/common/test/example_task.h b/src/common/test/example_task.h deleted file mode 100644 index f90cab68f6d95..0000000000000 --- a/src/common/test/example_task.h +++ /dev/null @@ -1,77 +0,0 @@ -#ifndef EXAMPLE_TASK_H -#define EXAMPLE_TASK_H - -#include "task.h" - -extern TaskBuilder *g_task_builder; - -const int64_t arg_value_size = 1000; - -static inline TaskExecutionSpec example_task_execution_spec_with_args( - int64_t num_args, - int64_t num_returns, - ObjectID arg_ids[]) { - TaskID parent_task_id = TaskID::from_random(); - FunctionID func_id = FunctionID::from_random(); - TaskSpec_start_construct(g_task_builder, UniqueID::nil(), parent_task_id, 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, num_returns); - for (int64_t i = 0; i < num_args; ++i) { - ObjectID arg_id; - if (arg_ids == NULL) { - arg_id = ObjectID::from_random(); - } else { - arg_id = arg_ids[i]; - } - TaskSpec_args_add_ref(g_task_builder, &arg_id, 1); - } - int64_t task_spec_size; - TaskSpec *spec = TaskSpec_finish_construct(g_task_builder, &task_spec_size); - std::vector execution_dependencies; - auto execution_spec = - TaskExecutionSpec(execution_dependencies, spec, task_spec_size); - TaskSpec_free(spec); - return execution_spec; -} - -static inline TaskExecutionSpec example_task_execution_spec( - int64_t num_args, - int64_t num_returns) { - return example_task_execution_spec_with_args(num_args, num_returns, NULL); -} - -static inline Task *example_task_with_args(int64_t num_args, - int64_t 
num_returns, - TaskStatus task_state, - ObjectID arg_ids[]) { - TaskExecutionSpec spec = - example_task_execution_spec_with_args(num_args, num_returns, arg_ids); - Task *instance = Task_alloc(spec, task_state, UniqueID::nil()); - return instance; -} - -static inline Task *example_task(int64_t num_args, - int64_t num_returns, - TaskStatus task_state) { - TaskExecutionSpec spec = example_task_execution_spec(num_args, num_returns); - Task *instance = Task_alloc(spec, task_state, UniqueID::nil()); - return instance; -} - -static inline bool Task_equals(Task *task1, Task *task2) { - if (task1->state != task2->state) { - return false; - } - if (!(task1->local_scheduler_id == task2->local_scheduler_id)) { - return false; - } - auto execution_spec1 = Task_task_execution_spec(task1); - auto execution_spec2 = Task_task_execution_spec(task2); - if (execution_spec1->SpecSize() != execution_spec2->SpecSize()) { - return false; - } - return memcmp(execution_spec1->Spec(), execution_spec2->Spec(), - execution_spec1->SpecSize()) == 0; -} - -#endif /* EXAMPLE_TASK_H */ diff --git a/src/common/test/io_tests.cc b/src/common/test/io_tests.cc deleted file mode 100644 index 092ca97b7d56d..0000000000000 --- a/src/common/test/io_tests.cc +++ /dev/null @@ -1,114 +0,0 @@ -#include "greatest.h" - -#include -#include -#include - -#include -#include - -#include "io.h" - -SUITE(io_tests); - -TEST ipc_socket_test(void) { -#ifndef _WIN32 - const char *socket_pathname = "/tmp/test-socket"; - int socket_fd = bind_ipc_sock(socket_pathname, true); - ASSERT(socket_fd >= 0); - - const char *test_string = "hello world"; - const char *test_bytes = "another string"; - pid_t pid = fork(); - if (pid == 0) { - close(socket_fd); - socket_fd = connect_ipc_sock(socket_pathname); - ASSERT(socket_fd >= 0); - write_log_message(socket_fd, test_string); - write_message(socket_fd, - static_cast(CommonMessageType::LOG_MESSAGE), - strlen(test_bytes), (uint8_t *) test_bytes); - close(socket_fd); - exit(0); - } else { - int client_fd = accept_client(socket_fd); - ASSERT(client_fd >= 0); - char *message = read_log_message(client_fd); - ASSERT(message != NULL); - ASSERT_STR_EQ(test_string, message); - free(message); - int64_t type; - int64_t len; - uint8_t *bytes; - read_message(client_fd, &type, &len, &bytes); - ASSERT(static_cast(type) == - CommonMessageType::LOG_MESSAGE); - ASSERT(memcmp(test_bytes, bytes, len) == 0); - free(bytes); - close(client_fd); - close(socket_fd); - unlink(socket_pathname); - } -#endif - PASS(); -} - -TEST long_ipc_socket_test(void) { -#ifndef _WIN32 - const char *socket_pathname = "/tmp/long-test-socket"; - int socket_fd = bind_ipc_sock(socket_pathname, true); - ASSERT(socket_fd >= 0); - - std::stringstream test_string_ss; - for (int i = 0; i < 10000; i++) { - test_string_ss << "hello world "; - } - std::string test_string = test_string_ss.str(); - const char *test_bytes = "another string"; - pid_t pid = fork(); - if (pid == 0) { - close(socket_fd); - socket_fd = connect_ipc_sock(socket_pathname); - ASSERT(socket_fd >= 0); - write_log_message(socket_fd, test_string.c_str()); - write_message(socket_fd, - static_cast(CommonMessageType::LOG_MESSAGE), - strlen(test_bytes), (uint8_t *) test_bytes); - close(socket_fd); - exit(0); - } else { - int client_fd = accept_client(socket_fd); - ASSERT(client_fd >= 0); - char *message = read_log_message(client_fd); - ASSERT(message != NULL); - ASSERT_STR_EQ(test_string.c_str(), message); - free(message); - int64_t type; - int64_t len; - uint8_t *bytes; - read_message(client_fd, &type, 
&len, &bytes); - ASSERT(static_cast(type) == - CommonMessageType::LOG_MESSAGE); - ASSERT(memcmp(test_bytes, bytes, len) == 0); - free(bytes); - close(client_fd); - close(socket_fd); - unlink(socket_pathname); - } - -#endif - PASS(); -} - -SUITE(io_tests) { - RUN_TEST(ipc_socket_test); - RUN_TEST(long_ipc_socket_test); -} - -GREATEST_MAIN_DEFS(); - -int main(int argc, char **argv) { - GREATEST_MAIN_BEGIN(); - RUN_SUITE(io_tests); - GREATEST_MAIN_END(); -} diff --git a/src/common/test/object_table_tests.cc b/src/common/test/object_table_tests.cc deleted file mode 100644 index 0599724386069..0000000000000 --- a/src/common/test/object_table_tests.cc +++ /dev/null @@ -1,919 +0,0 @@ -#include "greatest.h" - -#include "event_loop.h" -#include "example_task.h" -#include "test_common.h" -#include "common.h" -#include "state/db_client_table.h" -#include "state/object_table.h" -#include "state/redis.h" - -#include - -SUITE(object_table_tests); - -static event_loop *g_loop; -TaskBuilder *g_task_builder = NULL; - -/* ==== Test adding and looking up metadata ==== */ - -int new_object_failed = 0; -int new_object_succeeded = 0; -ObjectID new_object_id; -Task *new_object_task; -TaskSpec *new_object_task_spec; -TaskID new_object_task_id; - -void new_object_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - new_object_failed = 1; - event_loop_stop(g_loop); -} - -/* === Test adding an object with an associated task === */ - -void new_object_done_callback(ObjectID object_id, - TaskID task_id, - bool is_put, - void *user_context) { - new_object_succeeded = 1; - RAY_CHECK(object_id == new_object_id); - RAY_CHECK(task_id == new_object_task_id); - event_loop_stop(g_loop); -} - -void new_object_lookup_callback(ObjectID object_id, void *user_context) { - RAY_CHECK(object_id == new_object_id); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = new_object_fail_callback, - }; - DBHandle *db = (DBHandle *) user_context; - result_table_lookup(db, new_object_id, &retry, new_object_done_callback, - NULL); -} - -void new_object_task_callback(TaskID task_id, void *user_context) { - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = new_object_fail_callback, - }; - DBHandle *db = (DBHandle *) user_context; - result_table_add(db, new_object_id, new_object_task_id, false, &retry, - new_object_lookup_callback, (void *) db); -} - -void task_table_subscribe_done(TaskID task_id, void *user_context) { - RetryInfo retry = { - .num_retries = 5, .timeout = 100, .fail_callback = NULL, - }; - DBHandle *db = (DBHandle *) user_context; - task_table_add_task(db, Task_copy(new_object_task), &retry, - new_object_task_callback, db); -} - -TEST new_object_test(void) { - new_object_failed = 0; - new_object_succeeded = 0; - new_object_id = ObjectID::from_random(); - new_object_task = example_task(1, 1, TaskStatus::WAITING); - new_object_task_spec = Task_task_execution_spec(new_object_task)->Spec(); - new_object_task_id = TaskSpec_task_id(new_object_task_spec); - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = new_object_fail_callback, - }; - task_table_subscribe(db, UniqueID::nil(), TaskStatus::WAITING, NULL, NULL, - &retry, task_table_subscribe_done, db); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - 
ASSERT(new_object_succeeded); - ASSERT(!new_object_failed); - PASS(); -} - -/* === Test adding an object without an associated task === */ - -void new_object_no_task_callback(ObjectID object_id, - TaskID task_id, - bool is_put, - void *user_context) { - new_object_succeeded = 1; - RAY_CHECK(task_id.is_nil()); - event_loop_stop(g_loop); -} - -TEST new_object_no_task_test(void) { - new_object_failed = 0; - new_object_succeeded = 0; - new_object_id = ObjectID::from_random(); - new_object_task_id = TaskID::from_random(); - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = new_object_fail_callback, - }; - result_table_lookup(db, new_object_id, &retry, new_object_no_task_callback, - NULL); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(new_object_succeeded); - ASSERT(!new_object_failed); - PASS(); -} - -/* ==== Test if operations time out correctly ==== */ - -/* === Test lookup timeout === */ - -const char *lookup_timeout_context = "lookup_timeout"; -int lookup_failed = 0; - -void lookup_done_callback(ObjectID object_id, - bool never_created, - const std::vector &manager_vector, - void *context) { - /* The done callback should not be called. */ - RAY_CHECK(0); -} - -void lookup_fail_callback(UniqueID id, void *user_context, void *user_data) { - lookup_failed = 1; - RAY_CHECK(user_context == (void *) lookup_timeout_context); - event_loop_stop(g_loop); -} - -TEST lookup_timeout_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 5, .timeout = 100, .fail_callback = lookup_fail_callback, - }; - object_table_lookup(db, UniqueID::nil(), &retry, lookup_done_callback, - (void *) lookup_timeout_context); - /* Disconnect the database to see if the lookup times out. */ - close(db->context->c.fd); - for (auto context : db->contexts) { - close(context->c.fd); - } - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(lookup_failed); - PASS(); -} - -/* === Test add timeout === */ - -const char *add_timeout_context = "add_timeout"; -int add_failed = 0; - -void add_done_callback(ObjectID object_id, bool success, void *user_context) { - /* The done callback should not be called. */ - RAY_CHECK(0); -} - -void add_fail_callback(UniqueID id, void *user_context, void *user_data) { - add_failed = 1; - RAY_CHECK(user_context == (void *) add_timeout_context); - event_loop_stop(g_loop); -} - -TEST add_timeout_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 5, .timeout = 100, .fail_callback = add_fail_callback, - }; - object_table_add(db, UniqueID::nil(), 0, (unsigned char *) NIL_DIGEST, &retry, - add_done_callback, (void *) add_timeout_context); - /* Disconnect the database to see if the lookup times out. 
*/ - close(db->context->c.fd); - for (auto context : db->contexts) { - close(context->c.fd); - } - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(add_failed); - PASS(); -} - -/* === Test subscribe timeout === */ - -int subscribe_failed = 0; - -void subscribe_done_callback(ObjectID object_id, - int64_t data_size, - const std::vector &manager_vector, - void *user_context) { - /* The done callback should not be called. */ - RAY_CHECK(0); -} - -void subscribe_fail_callback(UniqueID id, void *user_context, void *user_data) { - subscribe_failed = 1; - event_loop_stop(g_loop); -} - -TEST subscribe_timeout_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = subscribe_fail_callback, - }; - object_table_subscribe_to_notifications(db, false, subscribe_done_callback, - NULL, &retry, NULL, NULL); - /* Disconnect the database to see if the lookup times out. */ - close(db->subscribe_context->c.fd); - for (auto subscribe_context : db->subscribe_contexts) { - close(subscribe_context->c.fd); - } - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(subscribe_failed); - PASS(); -} - -/* ==== Test if the retry is working correctly ==== */ - -int64_t reconnect_context_callback(event_loop *loop, - int64_t timer_id, - void *context) { - DBHandle *db = (DBHandle *) context; - /* Reconnect to redis. This is not reconnecting the pub/sub channel. */ - redisAsyncFree(db->context); - redisFree(db->sync_context); - db->context = redisAsyncConnect("127.0.0.1", 6379); - db->context->data = (void *) db; - db->sync_context = redisConnect("127.0.0.1", 6379); - /* Re-attach the database to the event loop (the file descriptor changed). */ - db_attach(db, loop, true); - RAY_LOG(DEBUG) << "Reconnected to Redis"; - return EVENT_LOOP_TIMER_DONE; -} - -int64_t terminate_event_loop_callback(event_loop *loop, - int64_t timer_id, - void *context) { - event_loop_stop(loop); - return EVENT_LOOP_TIMER_DONE; -} - -/* === Test lookup retry === */ - -const char *lookup_retry_context = "lookup_retry"; -int lookup_retry_succeeded = 0; - -void lookup_retry_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - /* The fail callback should not be called. 
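/* Illustrative sketch of the bounded event-loop scaffold shared by the tests
 * in this file: always install a timer that stops the loop, so a callback that
 * never fires cannot hang the test (the tests above use a 750 ms bound). The
 * wrapper below is hypothetical; it only restates the terminate pattern. */
#include "event_loop.h"

static int64_t stop_loop_callback(event_loop *loop, int64_t timer_id,
                                  void *context) {
  event_loop_stop(loop);
  return EVENT_LOOP_TIMER_DONE;
}

static void run_loop_with_deadline(event_loop *loop, int64_t timeout_ms) {
  /* The timer fires once after timeout_ms and terminates the loop even if no
   * Redis callback ever completes. */
  event_loop_add_timer(loop, timeout_ms,
                       (event_loop_timer_handler) stop_loop_callback, NULL);
  event_loop_run(loop);
}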
*/ - RAY_CHECK(0); -} - -/* === Test add retry === */ - -const char *add_retry_context = "add_retry"; -int add_retry_succeeded = 0; - -/* === Test add then lookup retry === */ - -void add_lookup_done_callback(ObjectID object_id, - bool never_created, - const std::vector &manager_ids, - void *context) { - DBHandle *db = (DBHandle *) context; - RAY_CHECK(manager_ids.size() == 1); - const std::vector managers = - db_client_table_get_ip_addresses(db, manager_ids); - RAY_CHECK(managers.at(0) == "127.0.0.1:11235"); - lookup_retry_succeeded = 1; -} - -void add_lookup_callback(ObjectID object_id, bool success, void *user_context) { - RAY_CHECK(success); - DBHandle *db = (DBHandle *) user_context; - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = lookup_retry_fail_callback, - }; - object_table_lookup(db, UniqueID::nil(), &retry, add_lookup_done_callback, - (void *) db); -} - -TEST add_lookup_test(void) { - g_loop = event_loop_create(); - lookup_retry_succeeded = 0; - /* Construct the arguments to db_connect. */ - std::vector db_connect_args; - db_connect_args.push_back("manager_address"); - db_connect_args.push_back("127.0.0.1:11235"); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", db_connect_args); - db_attach(db, g_loop, true); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = lookup_retry_fail_callback, - }; - object_table_add(db, UniqueID::nil(), 0, (unsigned char *) NIL_DIGEST, &retry, - add_lookup_callback, (void *) db); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(lookup_retry_succeeded); - PASS(); -} - -/* === Test add, remove, then lookup === */ -void add_remove_lookup_done_callback( - ObjectID object_id, - bool never_created, - const std::vector &manager_vector, - void *context) { - RAY_CHECK(context == (void *) lookup_retry_context); - RAY_CHECK(manager_vector.size() == 0); - lookup_retry_succeeded = 1; -} - -void add_remove_lookup_callback(ObjectID object_id, - bool success, - void *user_context) { - RAY_CHECK(success); - DBHandle *db = (DBHandle *) user_context; - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = lookup_retry_fail_callback, - }; - object_table_lookup(db, UniqueID::nil(), &retry, - add_remove_lookup_done_callback, - (void *) lookup_retry_context); -} - -void add_remove_callback(ObjectID object_id, bool success, void *user_context) { - RAY_CHECK(success); - DBHandle *db = (DBHandle *) user_context; - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = lookup_retry_fail_callback, - }; - object_table_remove(db, UniqueID::nil(), NULL, &retry, - add_remove_lookup_callback, (void *) db); -} - -TEST add_remove_lookup_test(void) { - g_loop = event_loop_create(); - lookup_retry_succeeded = 0; - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, true); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = lookup_retry_fail_callback, - }; - object_table_add(db, UniqueID::nil(), 0, (unsigned char *) NIL_DIGEST, &retry, - add_remove_callback, (void *) db); - /* Install handler for terminating the event loop. 
*/ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(lookup_retry_succeeded); - PASS(); -} - -/* ==== Test if late succeed is working correctly ==== */ - -/* === Test lookup late succeed === */ - -const char *lookup_late_context = "lookup_late"; -int lookup_late_failed = 0; - -void lookup_late_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - RAY_CHECK(user_context == (void *) lookup_late_context); - lookup_late_failed = 1; -} - -void lookup_late_done_callback(ObjectID object_id, - bool never_created, - const std::vector &manager_vector, - void *context) { - /* This function should never be called. */ - RAY_CHECK(0); -} - -TEST lookup_late_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 0, - .timeout = 0, - .fail_callback = lookup_late_fail_callback, - }; - object_table_lookup(db, UniqueID::nil(), &retry, lookup_late_done_callback, - (void *) lookup_late_context); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* First process timer events to make sure the timeout is processed before - * anything else. */ - aeProcessEvents(g_loop, AE_TIME_EVENTS); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(lookup_late_failed); - PASS(); -} - -/* === Test add late succeed === */ - -const char *add_late_context = "add_late"; -int add_late_failed = 0; - -void add_late_fail_callback(UniqueID id, void *user_context, void *user_data) { - RAY_CHECK(user_context == (void *) add_late_context); - add_late_failed = 1; -} - -void add_late_done_callback(ObjectID object_id, - bool success, - void *user_context) { - /* This function should never be called. */ - RAY_CHECK(0); -} - -TEST add_late_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 0, .timeout = 0, .fail_callback = add_late_fail_callback, - }; - object_table_add(db, UniqueID::nil(), 0, (unsigned char *) NIL_DIGEST, &retry, - add_late_done_callback, (void *) add_late_context); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* First process timer events to make sure the timeout is processed before - * anything else. 
*/ - aeProcessEvents(g_loop, AE_TIME_EVENTS); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(add_late_failed); - PASS(); -} - -/* === Test subscribe late succeed === */ - -const char *subscribe_late_context = "subscribe_late"; -int subscribe_late_failed = 0; - -void subscribe_late_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - RAY_CHECK(user_context == (void *) subscribe_late_context); - subscribe_late_failed = 1; -} - -void subscribe_late_done_callback(ObjectID object_id, - bool never_created, - const std::vector &manager_vector, - void *user_context) { - /* This function should never be called. */ - RAY_CHECK(0); -} - -TEST subscribe_late_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 0, - .timeout = 0, - .fail_callback = subscribe_late_fail_callback, - }; - object_table_subscribe_to_notifications(db, false, NULL, NULL, &retry, - subscribe_late_done_callback, - (void *) subscribe_late_context); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* First process timer events to make sure the timeout is processed before - * anything else. */ - aeProcessEvents(g_loop, AE_TIME_EVENTS); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(subscribe_late_failed); - PASS(); -} - -/* === Test subscribe object available succeed === */ - -const char *subscribe_success_context = "subscribe_success"; -int subscribe_success_done = 0; -int subscribe_success_succeeded = 0; -ObjectID subscribe_id; - -void subscribe_success_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - /* This function should never be called. */ - RAY_CHECK(0); -} - -void subscribe_success_done_callback( - ObjectID object_id, - bool never_created, - const std::vector &manager_vector, - void *user_context) { - RetryInfo retry = { - .num_retries = 0, .timeout = 750, .fail_callback = NULL, - }; - object_table_add((DBHandle *) user_context, subscribe_id, 0, - (unsigned char *) NIL_DIGEST, &retry, NULL, NULL); - subscribe_success_done = 1; -} - -void subscribe_success_object_available_callback( - ObjectID object_id, - int64_t data_size, - const std::vector &manager_vector, - void *user_context) { - RAY_CHECK(user_context == (void *) subscribe_success_context); - RAY_CHECK(object_id == subscribe_id); - RAY_CHECK(manager_vector.size() == 1); - subscribe_success_succeeded = 1; -} - -TEST subscribe_success_test(void) { - g_loop = event_loop_create(); - - /* Construct the arguments to db_connect. 
*/ - std::vector db_connect_args; - db_connect_args.push_back("manager_address"); - db_connect_args.push_back("127.0.0.1:11236"); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", db_connect_args); - db_attach(db, g_loop, false); - subscribe_id = ObjectID::from_random(); - - RetryInfo retry = { - .num_retries = 0, - .timeout = 100, - .fail_callback = subscribe_success_fail_callback, - }; - object_table_subscribe_to_notifications( - db, false, subscribe_success_object_available_callback, - (void *) subscribe_success_context, &retry, - subscribe_success_done_callback, (void *) db); - - ObjectID object_ids[1] = {subscribe_id}; - object_table_request_notifications(db, 1, object_ids, &retry); - - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - - ASSERT(subscribe_success_done); - ASSERT(subscribe_success_succeeded); - PASS(); -} - -/* Test if subscribe succeeds if the object is already present. */ -typedef struct { - const char *teststr; - int64_t data_size; -} subscribe_object_present_context_t; - -const char *subscribe_object_present_str = "subscribe_object_present"; -int subscribe_object_present_succeeded = 0; - -void subscribe_object_present_object_available_callback( - ObjectID object_id, - int64_t data_size, - const std::vector &manager_vector, - void *user_context) { - subscribe_object_present_context_t *ctx = - (subscribe_object_present_context_t *) user_context; - RAY_CHECK(ctx->data_size == data_size); - RAY_CHECK(strcmp(subscribe_object_present_str, ctx->teststr) == 0); - subscribe_object_present_succeeded = 1; - RAY_CHECK(manager_vector.size() == 1); -} - -void fatal_fail_callback(UniqueID id, void *user_context, void *user_data) { - /* This function should never be called. */ - RAY_CHECK(0); -} - -TEST subscribe_object_present_test(void) { - int64_t data_size = 0xF1F0; - subscribe_object_present_context_t myctx = {subscribe_object_present_str, - data_size}; - - g_loop = event_loop_create(); - /* Construct the arguments to db_connect. */ - std::vector db_connect_args; - db_connect_args.push_back("manager_address"); - db_connect_args.push_back("127.0.0.1:11236"); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", db_connect_args); - db_attach(db, g_loop, false); - UniqueID id = UniqueID::from_random(); - RetryInfo retry = { - .num_retries = 0, .timeout = 100, .fail_callback = fatal_fail_callback, - }; - object_table_add(db, id, data_size, (unsigned char *) NIL_DIGEST, &retry, - NULL, NULL); - object_table_subscribe_to_notifications( - db, false, subscribe_object_present_object_available_callback, - (void *) &myctx, &retry, NULL, (void *) db); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to create do the add and subscribe. */ - event_loop_run(g_loop); - - ObjectID object_ids[1] = {id}; - object_table_request_notifications(db, 1, object_ids, &retry); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to do the request notifications. 
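/* Illustrative sketch of the notification protocol these tests exercise:
 * subscribe once per DB handle, then request notifications for specific
 * object IDs; the available-callback fires whether the object is already
 * present or is added later. The helper names and the element type of
 * manager_vector (assumed here to be DBClientID) are illustrative. */
#include <vector>
#include "state/object_table.h"

static void on_object_available(ObjectID object_id, int64_t data_size,
                                const std::vector<DBClientID> &manager_vector,
                                void *user_context) {
  RAY_LOG(DEBUG) << "object available on " << manager_vector.size()
                 << " manager(s), data size " << data_size;
}

static void watch_object(DBHandle *db, ObjectID id, RetryInfo *retry) {
  /* Register the callback once per DB handle ... */
  object_table_subscribe_to_notifications(db, /* subscribe_all */ false,
                                          on_object_available, NULL, retry,
                                          NULL, NULL);
  /* ... then ask for notifications about the specific IDs of interest. */
  ObjectID object_ids[1] = {id};
  object_table_request_notifications(db, 1, object_ids, retry);
}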
*/ - event_loop_run(g_loop); - - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(subscribe_object_present_succeeded == 1); - PASS(); -} - -/* Test if subscribe is not called if object is not present. */ - -const char *subscribe_object_not_present_context = - "subscribe_object_not_present"; - -void subscribe_object_not_present_object_available_callback( - ObjectID object_id, - int64_t data_size, - const std::vector &manager_vector, - void *user_context) { - /* This should not be called. */ - RAY_CHECK(0); -} - -TEST subscribe_object_not_present_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - UniqueID id = UniqueID::from_random(); - RetryInfo retry = { - .num_retries = 0, .timeout = 100, .fail_callback = NULL, - }; - object_table_subscribe_to_notifications( - db, false, subscribe_object_not_present_object_available_callback, - (void *) subscribe_object_not_present_context, &retry, NULL, (void *) db); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to do the subscribe. */ - event_loop_run(g_loop); - - ObjectID object_ids[1] = {id}; - object_table_request_notifications(db, 1, object_ids, &retry); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to do the request notifications. */ - event_loop_run(g_loop); - - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - PASS(); -} - -/* Test if subscribe is called if object becomes available later. */ - -const char *subscribe_object_available_later_context = - "subscribe_object_available_later"; -int subscribe_object_available_later_succeeded = 0; - -void subscribe_object_available_later_object_available_callback( - ObjectID object_id, - int64_t data_size, - const std::vector &manager_vector, - void *user_context) { - subscribe_object_present_context_t *myctx = - (subscribe_object_present_context_t *) user_context; - RAY_CHECK(myctx->data_size == data_size); - RAY_CHECK(strcmp(myctx->teststr, subscribe_object_available_later_context) == - 0); - /* Make sure the callback is only called once. */ - subscribe_object_available_later_succeeded += 1; - RAY_CHECK(manager_vector.size() == 1); -} - -TEST subscribe_object_available_later_test(void) { - int64_t data_size = 0xF1F0; - subscribe_object_present_context_t *myctx = - (subscribe_object_present_context_t *) malloc( - sizeof(subscribe_object_present_context_t)); - myctx->teststr = subscribe_object_available_later_context; - myctx->data_size = data_size; - - g_loop = event_loop_create(); - /* Construct the arguments to db_connect. 
*/ - std::vector db_connect_args; - db_connect_args.push_back("manager_address"); - db_connect_args.push_back("127.0.0.1:11236"); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", db_connect_args); - db_attach(db, g_loop, false); - UniqueID id = UniqueID::from_random(); - RetryInfo retry = { - .num_retries = 0, .timeout = 100, .fail_callback = NULL, - }; - object_table_subscribe_to_notifications( - db, false, subscribe_object_available_later_object_available_callback, - (void *) myctx, &retry, NULL, (void *) db); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to do the subscribe. */ - event_loop_run(g_loop); - - ObjectID object_ids[1] = {id}; - object_table_request_notifications(db, 1, object_ids, &retry); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to do the request notifications. */ - event_loop_run(g_loop); - - ASSERT_EQ(subscribe_object_available_later_succeeded, 0); - object_table_add(db, id, data_size, (unsigned char *) NIL_DIGEST, &retry, - NULL, NULL); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to do the object table add. */ - event_loop_run(g_loop); - - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT_EQ(subscribe_object_available_later_succeeded, 1); - /* Reset the global variable before exiting this unit test. */ - subscribe_object_available_later_succeeded = 0; - free(myctx); - PASS(); -} - -TEST subscribe_object_available_subscribe_all(void) { - int64_t data_size = 0xF1F0; - subscribe_object_present_context_t myctx = { - subscribe_object_available_later_context, data_size}; - g_loop = event_loop_create(); - /* Construct the arguments to db_connect. */ - std::vector db_connect_args; - db_connect_args.push_back("manager_address"); - db_connect_args.push_back("127.0.0.1:11236"); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", db_connect_args); - db_attach(db, g_loop, false); - UniqueID id = UniqueID::from_random(); - RetryInfo retry = { - .num_retries = 0, .timeout = 100, .fail_callback = NULL, - }; - object_table_subscribe_to_notifications( - db, true, subscribe_object_available_later_object_available_callback, - (void *) &myctx, &retry, NULL, (void *) db); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to do the subscribe. */ - event_loop_run(g_loop); - - /* At this point we don't expect any object notifications received. */ - ASSERT_EQ(subscribe_object_available_later_succeeded, 0); - object_table_add(db, id, data_size, (unsigned char *) NIL_DIGEST, &retry, - NULL, NULL); - /* Install handler to terminate event loop after 750ms. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* Run the event loop to do the object table add. */ - event_loop_run(g_loop); - /* At this point we assume that object table add completed. 
*/ - - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - /* Assert that the object table add completed and notification callback fired. - */ - printf("subscribe_all object info test: callback fired: %d times\n", - subscribe_object_available_later_succeeded); - fflush(stdout); - ASSERT_EQ(subscribe_object_available_later_succeeded, 1); - /* Reset the global variable before exiting this unit test. */ - subscribe_object_available_later_succeeded = 0; - PASS(); -} - -SUITE(object_table_tests) { - RUN_REDIS_TEST(new_object_test); - RUN_REDIS_TEST(new_object_no_task_test); - // RUN_REDIS_TEST(lookup_timeout_test); - // RUN_REDIS_TEST(add_timeout_test); - // RUN_REDIS_TEST(subscribe_timeout_test); - RUN_REDIS_TEST(add_lookup_test); - RUN_REDIS_TEST(add_remove_lookup_test); - // RUN_REDIS_TEST(lookup_late_test); - // RUN_REDIS_TEST(add_late_test); - // RUN_REDIS_TEST(subscribe_late_test); - RUN_REDIS_TEST(subscribe_success_test); - RUN_REDIS_TEST(subscribe_object_not_present_test); - RUN_REDIS_TEST(subscribe_object_available_later_test); - RUN_REDIS_TEST(subscribe_object_available_subscribe_all); -} - -GREATEST_MAIN_DEFS(); - -int main(int argc, char **argv) { - g_task_builder = make_task_builder(); - GREATEST_MAIN_BEGIN(); - RUN_SUITE(object_table_tests); - GREATEST_MAIN_END(); -} diff --git a/src/common/test/redis_tests.cc b/src/common/test/redis_tests.cc deleted file mode 100644 index 7db7ae2ee26e9..0000000000000 --- a/src/common/test/redis_tests.cc +++ /dev/null @@ -1,238 +0,0 @@ -#include "greatest.h" - -#include -#include - -#include - -#include "event_loop.h" -#include "state/db.h" -#include "state/redis.h" -#include "io.h" -#include "logging.h" -#include "test_common.h" - -SUITE(redis_tests); - -const char *test_set_format = "SET %s %s"; -const char *test_get_format = "GET %s"; -const char *test_key = "foo"; -const char *test_value = "bar"; -std::vector connections; - -void write_formatted_log_message(int socket_fd, const char *format, ...) 
{ - va_list ap; - - /* Get cmd size */ - va_start(ap, format); - size_t cmd_size = vsnprintf(nullptr, 0, format, ap) + 1; - va_end(ap); - - /* Print va to cmd */ - char cmd[cmd_size]; - va_start(ap, format); - vsnprintf(cmd, cmd_size, format, ap); - va_end(ap); - - write_log_message(socket_fd, cmd); -} - -int async_redis_socket_test_callback_called = 0; - -void async_redis_socket_test_callback(redisAsyncContext *ac, - void *r, - void *privdata) { - async_redis_socket_test_callback_called = 1; - redisContext *context = redisConnect("127.0.0.1", 6379); - redisReply *reply = - (redisReply *) redisCommand(context, test_get_format, test_key); - redisFree(context); - RAY_CHECK(reply != NULL); - if (strcmp(reply->str, test_value)) { - freeReplyObject(reply); - RAY_CHECK(0); - } - freeReplyObject(reply); -} - -TEST redis_socket_test(void) { - const char *socket_pathname = "/tmp/redis-test-socket"; - redisContext *context = redisConnect("127.0.0.1", 6379); - ASSERT(context != NULL); - int socket_fd = bind_ipc_sock(socket_pathname, true); - ASSERT(socket_fd >= 0); - - int client_fd = connect_ipc_sock(socket_pathname); - ASSERT(client_fd >= 0); - write_formatted_log_message(client_fd, test_set_format, test_key, test_value); - - int server_fd = accept_client(socket_fd); - char *cmd = read_log_message(server_fd); - close(client_fd); - close(server_fd); - close(socket_fd); - unlink(socket_pathname); - - redisReply *reply = (redisReply *) redisCommand(context, cmd, 0, 0); - freeReplyObject(reply); - reply = (redisReply *) redisCommand(context, "GET %s", test_key); - ASSERT(reply != NULL); - ASSERT_STR_EQ(reply->str, test_value); - freeReplyObject(reply); - - free(cmd); - redisFree(context); - PASS(); -} - -void redis_read_callback(event_loop *loop, int fd, void *context, int events) { - DBHandle *db = (DBHandle *) context; - char *cmd = read_log_message(fd); - redisAsyncCommand(db->context, async_redis_socket_test_callback, NULL, cmd); - free(cmd); -} - -void redis_accept_callback(event_loop *loop, - int socket_fd, - void *context, - int events) { - int accept_fd = accept_client(socket_fd); - RAY_CHECK(accept_fd >= 0); - connections.push_back(accept_fd); - event_loop_add_file(loop, accept_fd, EVENT_LOOP_READ, redis_read_callback, - context); -} - -int timeout_handler(event_loop *loop, timer_id timer_id, void *context) { - event_loop_stop(loop); - return EVENT_LOOP_TIMER_DONE; -} - -TEST async_redis_socket_test(void) { - event_loop *loop = event_loop_create(); - - /* Start IPC channel. */ - const char *socket_pathname = "/tmp/async-redis-test-socket"; - int socket_fd = bind_ipc_sock(socket_pathname, true); - ASSERT(socket_fd >= 0); - connections.push_back(socket_fd); - - /* Start connection to Redis. */ - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "test_process", - "127.0.0.1", std::vector()); - db_attach(db, loop, false); - - /* Send a command to the Redis process. 
*/ - int client_fd = connect_ipc_sock(socket_pathname); - ASSERT(client_fd >= 0); - connections.push_back(client_fd); - write_formatted_log_message(client_fd, test_set_format, test_key, test_value); - - event_loop_add_file(loop, client_fd, EVENT_LOOP_READ, redis_read_callback, - db); - event_loop_add_file(loop, socket_fd, EVENT_LOOP_READ, redis_accept_callback, - db); - event_loop_add_timer(loop, 100, timeout_handler, NULL); - event_loop_run(loop); - - ASSERT(async_redis_socket_test_callback_called); - - db_disconnect(db); - event_loop_destroy(loop); - - for (int const &p : connections) { - close(p); - } - unlink(socket_pathname); - connections.clear(); - PASS(); -} - -int logging_test_callback_called = 0; - -void logging_test_callback(redisAsyncContext *ac, void *r, void *privdata) { - logging_test_callback_called = 1; - redisContext *context = redisConnect("127.0.0.1", 6379); - redisReply *reply = (redisReply *) redisCommand(context, "KEYS %s", "log:*"); - redisFree(context); - RAY_CHECK(reply != NULL); - RAY_CHECK(reply->elements > 0); - freeReplyObject(reply); -} - -void logging_read_callback(event_loop *loop, - int fd, - void *context, - int events) { - DBHandle *conn = (DBHandle *) context; - char *cmd = read_log_message(fd); - redisAsyncCommand(conn->context, logging_test_callback, NULL, cmd, - (char *) conn->client.data(), sizeof(conn->client)); - free(cmd); -} - -void logging_accept_callback(event_loop *loop, - int socket_fd, - void *context, - int events) { - int accept_fd = accept_client(socket_fd); - RAY_CHECK(accept_fd >= 0); - connections.push_back(accept_fd); - event_loop_add_file(loop, accept_fd, EVENT_LOOP_READ, logging_read_callback, - context); -} - -TEST logging_test(void) { - event_loop *loop = event_loop_create(); - - /* Start IPC channel. */ - const char *socket_pathname = "/tmp/logging-test-socket"; - int socket_fd = bind_ipc_sock(socket_pathname, true); - ASSERT(socket_fd >= 0); - connections.push_back(socket_fd); - - /* Start connection to Redis. */ - DBHandle *conn = db_connect(std::string("127.0.0.1"), 6379, "test_process", - "127.0.0.1", std::vector()); - db_attach(conn, loop, false); - - /* Send a command to the Redis process. 
   */
-  int client_fd = connect_ipc_sock(socket_pathname);
-  ASSERT(client_fd >= 0);
-  connections.push_back(client_fd);
-  RayLogger *logger = RayLogger_init("worker", RAY_LOG_INFO, 0, &client_fd);
-  RayLogger_log(logger, RAY_LOG_INFO, "TEST", "Message");
-
-  event_loop_add_file(loop, socket_fd, EVENT_LOOP_READ, logging_accept_callback,
-                      conn);
-  event_loop_add_file(loop, client_fd, EVENT_LOOP_READ, logging_read_callback,
-                      conn);
-  event_loop_add_timer(loop, 100, timeout_handler, NULL);
-  event_loop_run(loop);
-
-  ASSERT(logging_test_callback_called);
-
-  RayLogger_free(logger);
-  db_disconnect(conn);
-  event_loop_destroy(loop);
-  for (int const &p : connections) {
-    close(p);
-  }
-  unlink(socket_pathname);
-  connections.clear();
-  PASS();
-}
-
-SUITE(redis_tests) {
-  RUN_REDIS_TEST(redis_socket_test);
-  RUN_REDIS_TEST(async_redis_socket_test);
-  RUN_REDIS_TEST(logging_test);
-}
-
-GREATEST_MAIN_DEFS();
-
-int main(int argc, char **argv) {
-  GREATEST_MAIN_BEGIN();
-  RUN_SUITE(redis_tests);
-  GREATEST_MAIN_END();
-}
diff --git a/src/common/test/run_tests.sh b/src/common/test/run_tests.sh
deleted file mode 100644
index 5ccb1e3f92ffa..0000000000000
--- a/src/common/test/run_tests.sh
+++ /dev/null
@@ -1,43 +0,0 @@
-#!/usr/bin/env bash
-
-# This needs to be run in the build tree, which is normally ray/build
-
-# Cause the script to exit if a single command fails.
-set -ex
-
-LaunchRedis() {
-  port=$1
-  if [[ "${RAY_USE_NEW_GCS}" = "on" ]]; then
-    ./src/credis/redis/src/redis-server \
-      --loglevel warning \
-      --loadmodule ./src/credis/build/src/libmember.so \
-      --loadmodule ./src/common/redis_module/libray_redis_module.so \
-      --port $port &
-  else
-    ./src/common/thirdparty/redis/src/redis-server \
-      --loglevel warning \
-      --loadmodule ./src/common/redis_module/libray_redis_module.so \
-      --port $port &
-  fi
-  sleep 1s
-}
-
-
-# Start the Redis shards.
-LaunchRedis 6379
-LaunchRedis 6380
-# Register the shard location with the primary shard.
-./src/common/thirdparty/redis/src/redis-cli set NumRedisShards 1
-./src/common/thirdparty/redis/src/redis-cli rpush RedisShards 127.0.0.1:6380
-
-if [ -z "$RAY_USE_NEW_GCS" ]; then
-  ./src/common/db_tests
-  ./src/common/io_tests
-  ./src/common/task_tests
-  ./src/common/redis_tests
-  ./src/common/task_table_tests
-  ./src/common/object_table_tests
-fi
-
-./src/common/thirdparty/redis/src/redis-cli -p 6379 shutdown
-./src/common/thirdparty/redis/src/redis-cli -p 6380 shutdown
diff --git a/src/common/test/run_valgrind.sh b/src/common/test/run_valgrind.sh
deleted file mode 100644
index 418a91366e132..0000000000000
--- a/src/common/test/run_valgrind.sh
+++ /dev/null
@@ -1,27 +0,0 @@
-#!/usr/bin/env bash
-
-# This needs to be run in the build tree, which is normally ray/build
-
-set -x
-
-# Cause the script to exit if a single command fails.
-set -e
-
-if [ -z "$RAY_USE_NEW_GCS" ]; then
-  # Start the Redis shards.
-  ./src/common/thirdparty/redis/src/redis-server --loglevel warning --loadmodule ./src/common/redis_module/libray_redis_module.so --port 6379 &
-  ./src/common/thirdparty/redis/src/redis-server --loglevel warning --loadmodule ./src/common/redis_module/libray_redis_module.so --port 6380 &
-  sleep 1s
-  # Register the shard location with the primary shard.
-  ./src/common/thirdparty/redis/src/redis-cli set NumRedisShards 1
-  ./src/common/thirdparty/redis/src/redis-cli rpush RedisShards 127.0.0.1:6380
-
-  valgrind --track-origins=yes --leak-check=full --show-leak-kinds=all --leak-check-heuristics=stdstring --error-exitcode=1 ./src/common/db_tests
-  valgrind --track-origins=yes --leak-check=full --show-leak-kinds=all --leak-check-heuristics=stdstring --error-exitcode=1 ./src/common/io_tests
-  valgrind --track-origins=yes --leak-check=full --show-leak-kinds=all --leak-check-heuristics=stdstring --error-exitcode=1 ./src/common/task_tests
-  valgrind --track-origins=yes --leak-check=full --show-leak-kinds=all --leak-check-heuristics=stdstring --error-exitcode=1 ./src/common/redis_tests
-  valgrind --track-origins=yes --leak-check=full --show-leak-kinds=all --leak-check-heuristics=stdstring --error-exitcode=1 ./src/common/task_table_tests
-  valgrind --track-origins=yes --leak-check=full --show-leak-kinds=all --leak-check-heuristics=stdstring --error-exitcode=1 ./src/common/object_table_tests
-  ./src/common/thirdparty/redis/src/redis-cli shutdown
-  ./src/common/thirdparty/redis/src/redis-cli -p 6380 shutdown
-fi
diff --git a/src/common/test/task_table_tests.cc b/src/common/test/task_table_tests.cc
deleted file mode 100644
index f94aca3b132c4..0000000000000
--- a/src/common/test/task_table_tests.cc
+++ /dev/null
@@ -1,460 +0,0 @@
-#include "greatest.h"
-
-#include "event_loop.h"
-#include "example_task.h"
-#include "test_common.h"
-#include "common.h"
-#include "state/object_table.h"
-#include "state/redis.h"
-
-#include
-#include
-
-SUITE(task_table_tests);
-
-event_loop *g_loop;
-TaskBuilder *g_task_builder = NULL;
-
-/* ==== Test operations in non-failure scenario ==== */
-
-/* === A lookup of a task not in the table === */
-
-TaskID lookup_nil_id;
-int lookup_nil_success = 0;
-const char *lookup_nil_context = "lookup_nil";
-
-void lookup_nil_fail_callback(UniqueID id,
-                              void *user_context,
-                              void *user_data) {
-  /* The fail callback should not be called. */
-  RAY_CHECK(0);
-}
-
-void lookup_nil_success_callback(Task *task, void *context) {
-  lookup_nil_success = 1;
-  RAY_CHECK(task == NULL);
-  RAY_CHECK(context == (void *) lookup_nil_context);
-  event_loop_stop(g_loop);
-}
-
-TEST lookup_nil_test(void) {
-  lookup_nil_id = TaskID::from_random();
-  g_loop = event_loop_create();
-  DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager",
-                            "127.0.0.1", std::vector<std::string>());
-  db_attach(db, g_loop, false);
-  RetryInfo retry = {
-      .num_retries = 5,
-      .timeout = 1000,
-      .fail_callback = lookup_nil_fail_callback,
-  };
-  task_table_get_task(db, lookup_nil_id, &retry, lookup_nil_success_callback,
-                      (void *) lookup_nil_context);
-  /* Disconnect the database to see if the lookup times out. */
-  event_loop_run(g_loop);
-  db_disconnect(db);
-  destroy_outstanding_callbacks(g_loop);
-  event_loop_destroy(g_loop);
-  ASSERT(lookup_nil_success);
-  PASS();
-}
-
-/* === A lookup of a task after it's added returns the same spec === */
-
-int add_success = 0;
-int lookup_success = 0;
-Task *add_lookup_task;
-const char *add_lookup_context = "add_lookup";
-
-void add_lookup_fail_callback(UniqueID id,
-                              void *user_context,
-                              void *user_data) {
-  /* The fail callback should not be called.
*/ - RAY_CHECK(0); -} - -void lookup_success_callback(Task *task, void *context) { - lookup_success = 1; - RAY_CHECK(Task_equals(task, add_lookup_task)); - event_loop_stop(g_loop); -} - -void add_success_callback(TaskID task_id, void *context) { - add_success = 1; - RAY_CHECK(TaskID_equal(task_id, Task_task_id(add_lookup_task))); - - DBHandle *db = (DBHandle *) context; - RetryInfo retry = { - .num_retries = 5, - .timeout = 1000, - .fail_callback = add_lookup_fail_callback, - }; - task_table_get_task(db, task_id, &retry, lookup_success_callback, - (void *) add_lookup_context); -} - -void subscribe_success_callback(TaskID task_id, void *context) { - DBHandle *db = (DBHandle *) context; - RetryInfo retry = { - .num_retries = 5, - .timeout = 1000, - .fail_callback = add_lookup_fail_callback, - }; - task_table_add_task(db, Task_copy(add_lookup_task), &retry, - add_success_callback, (void *) db); -} - -TEST add_lookup_test(void) { - add_lookup_task = example_task(1, 1, TaskStatus::WAITING); - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 5, - .timeout = 1000, - .fail_callback = add_lookup_fail_callback, - }; - /* Wait for subscription to succeed before adding the task. */ - task_table_subscribe(db, UniqueID::nil(), TaskStatus::WAITING, NULL, NULL, - &retry, subscribe_success_callback, (void *) db); - /* Disconnect the database to see if the lookup times out. */ - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(add_success); - ASSERT(lookup_success); - PASS(); -} - -/* ==== Test if operations time out correctly ==== */ - -/* === Test subscribe timeout === */ - -const char *subscribe_timeout_context = "subscribe_timeout"; -int subscribe_failed = 0; - -void subscribe_done_callback(TaskID task_id, void *user_context) { - /* The done callback should not be called. */ - RAY_CHECK(0); -} - -void subscribe_fail_callback(UniqueID id, void *user_context, void *user_data) { - subscribe_failed = 1; - RAY_CHECK(user_context == (void *) subscribe_timeout_context); - event_loop_stop(g_loop); -} - -TEST subscribe_timeout_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = subscribe_fail_callback, - }; - task_table_subscribe(db, UniqueID::nil(), TaskStatus::WAITING, NULL, NULL, - &retry, subscribe_done_callback, - (void *) subscribe_timeout_context); - /* Disconnect the database to see if the subscribe times out. */ - close(db->subscribe_context->c.fd); - for (size_t i = 0; i < db->subscribe_contexts.size(); ++i) { - close(db->subscribe_contexts[i]->c.fd); - } - aeProcessEvents(g_loop, AE_TIME_EVENTS); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(subscribe_failed); - PASS(); -} - -/* === Test publish timeout === */ - -const char *publish_timeout_context = "publish_timeout"; -int publish_failed = 0; - -void publish_done_callback(TaskID task_id, void *user_context) { - /* The done callback should not be called. 
*/ - RAY_CHECK(0); -} - -void publish_fail_callback(UniqueID id, void *user_context, void *user_data) { - publish_failed = 1; - RAY_CHECK(user_context == (void *) publish_timeout_context); - event_loop_stop(g_loop); -} - -TEST publish_timeout_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - Task *task = example_task(1, 1, TaskStatus::WAITING); - RetryInfo retry = { - .num_retries = 5, .timeout = 100, .fail_callback = publish_fail_callback, - }; - task_table_subscribe(db, UniqueID::nil(), TaskStatus::WAITING, NULL, NULL, - &retry, NULL, NULL); - task_table_add_task(db, task, &retry, publish_done_callback, - (void *) publish_timeout_context); - /* Disconnect the database to see if the publish times out. */ - close(db->context->c.fd); - for (size_t i = 0; i < db->contexts.size(); ++i) { - close(db->contexts[i]->c.fd); - } - aeProcessEvents(g_loop, AE_TIME_EVENTS); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(publish_failed); - PASS(); -} - -/* ==== Test if the retry is working correctly ==== */ - -int64_t reconnect_db_callback(event_loop *loop, - int64_t timer_id, - void *context) { - DBHandle *db = (DBHandle *) context; - /* Reconnect to redis. */ - redisAsyncFree(db->subscribe_context); - db->subscribe_context = redisAsyncConnect("127.0.0.1", 6379); - db->subscribe_context->data = (void *) db; - for (size_t i = 0; i < db->subscribe_contexts.size(); ++i) { - redisAsyncFree(db->subscribe_contexts[i]); - db->subscribe_contexts[i] = redisAsyncConnect("127.0.0.1", 6380 + i); - db->subscribe_contexts[i]->data = (void *) db; - } - /* Re-attach the database to the event loop (the file descriptor changed). */ - db_attach(db, loop, true); - return EVENT_LOOP_TIMER_DONE; -} - -int64_t terminate_event_loop_callback(event_loop *loop, - int64_t timer_id, - void *context) { - event_loop_stop(loop); - return EVENT_LOOP_TIMER_DONE; -} - -/* === Test subscribe retry === */ - -const char *subscribe_retry_context = "subscribe_retry"; -int subscribe_retry_succeeded = 0; - -void subscribe_retry_done_callback(ObjectID object_id, void *user_context) { - RAY_CHECK(user_context == (void *) subscribe_retry_context); - subscribe_retry_succeeded = 1; -} - -void subscribe_retry_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - /* The fail callback should not be called. */ - RAY_CHECK(0); -} - -TEST subscribe_retry_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = subscribe_retry_fail_callback, - }; - task_table_subscribe(db, UniqueID::nil(), TaskStatus::WAITING, NULL, NULL, - &retry, subscribe_retry_done_callback, - (void *) subscribe_retry_context); - /* Disconnect the database to see if the subscribe times out. */ - close(db->subscribe_context->c.fd); - for (size_t i = 0; i < db->subscribe_contexts.size(); ++i) { - close(db->subscribe_contexts[i]->c.fd); - } - /* Install handler for reconnecting the database. */ - event_loop_add_timer(g_loop, 150, - (event_loop_timer_handler) reconnect_db_callback, db); - /* Install handler for terminating the event loop. 
*/ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(subscribe_retry_succeeded); - PASS(); -} - -/* === Test publish retry === */ - -const char *publish_retry_context = "publish_retry"; -int publish_retry_succeeded = 0; - -void publish_retry_done_callback(ObjectID object_id, void *user_context) { - RAY_CHECK(user_context == (void *) publish_retry_context); - publish_retry_succeeded = 1; -} - -void publish_retry_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - /* The fail callback should not be called. */ - RAY_CHECK(0); -} - -TEST publish_retry_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - Task *task = example_task(1, 1, TaskStatus::WAITING); - RetryInfo retry = { - .num_retries = 5, - .timeout = 100, - .fail_callback = publish_retry_fail_callback, - }; - task_table_subscribe(db, UniqueID::nil(), TaskStatus::WAITING, NULL, NULL, - &retry, NULL, NULL); - task_table_add_task(db, task, &retry, publish_retry_done_callback, - (void *) publish_retry_context); - /* Disconnect the database to see if the publish times out. */ - close(db->subscribe_context->c.fd); - for (size_t i = 0; i < db->subscribe_contexts.size(); ++i) { - close(db->subscribe_contexts[i]->c.fd); - } - /* Install handler for reconnecting the database. */ - event_loop_add_timer(g_loop, 150, - (event_loop_timer_handler) reconnect_db_callback, db); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(publish_retry_succeeded); - PASS(); -} - -/* ==== Test if late succeed is working correctly ==== */ - -/* === Test subscribe late succeed === */ - -const char *subscribe_late_context = "subscribe_late"; -int subscribe_late_failed = 0; - -void subscribe_late_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - RAY_CHECK(user_context == (void *) subscribe_late_context); - subscribe_late_failed = 1; -} - -void subscribe_late_done_callback(TaskID task_id, void *user_context) { - /* This function should never be called. */ - RAY_CHECK(0); -} - -TEST subscribe_late_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - RetryInfo retry = { - .num_retries = 0, - .timeout = 0, - .fail_callback = subscribe_late_fail_callback, - }; - task_table_subscribe(db, UniqueID::nil(), TaskStatus::WAITING, NULL, NULL, - &retry, subscribe_late_done_callback, - (void *) subscribe_late_context); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* First process timer events to make sure the timeout is processed before - * anything else. 
*/ - aeProcessEvents(g_loop, AE_TIME_EVENTS); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(subscribe_late_failed); - PASS(); -} - -/* === Test publish late succeed === */ - -const char *publish_late_context = "publish_late"; -int publish_late_failed = 0; - -void publish_late_fail_callback(UniqueID id, - void *user_context, - void *user_data) { - RAY_CHECK(user_context == (void *) publish_late_context); - publish_late_failed = 1; -} - -void publish_late_done_callback(TaskID task_id, void *user_context) { - /* This function should never be called. */ - RAY_CHECK(0); -} - -TEST publish_late_test(void) { - g_loop = event_loop_create(); - DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager", - "127.0.0.1", std::vector()); - db_attach(db, g_loop, false); - Task *task = example_task(1, 1, TaskStatus::WAITING); - RetryInfo retry = { - .num_retries = 0, - .timeout = 0, - .fail_callback = publish_late_fail_callback, - }; - task_table_subscribe(db, UniqueID::nil(), TaskStatus::WAITING, NULL, NULL, - NULL, NULL, NULL); - task_table_add_task(db, task, &retry, publish_late_done_callback, - (void *) publish_late_context); - /* Install handler for terminating the event loop. */ - event_loop_add_timer(g_loop, 750, - (event_loop_timer_handler) terminate_event_loop_callback, - NULL); - /* First process timer events to make sure the timeout is processed before - * anything else. */ - aeProcessEvents(g_loop, AE_TIME_EVENTS); - event_loop_run(g_loop); - db_disconnect(db); - destroy_outstanding_callbacks(g_loop); - event_loop_destroy(g_loop); - ASSERT(publish_late_failed); - PASS(); -} - -SUITE(task_table_tests) { - RUN_REDIS_TEST(lookup_nil_test); - RUN_REDIS_TEST(add_lookup_test); - // RUN_REDIS_TEST(subscribe_timeout_test); - // RUN_REDIS_TEST(publish_timeout_test); - // RUN_REDIS_TEST(subscribe_retry_test); - // RUN_REDIS_TEST(publish_retry_test); - // RUN_REDIS_TEST(subscribe_late_test); - // RUN_REDIS_TEST(publish_late_test); -} - -GREATEST_MAIN_DEFS(); - -int main(int argc, char **argv) { - g_task_builder = make_task_builder(); - GREATEST_MAIN_BEGIN(); - RUN_SUITE(task_table_tests); - GREATEST_MAIN_END(); -} diff --git a/src/common/test/task_tests.cc b/src/common/test/task_tests.cc deleted file mode 100644 index 2277912e7dec0..0000000000000 --- a/src/common/test/task_tests.cc +++ /dev/null @@ -1,212 +0,0 @@ -#include "greatest.h" - -#include -#include -#include - -#include "common.h" -#include "test_common.h" -#include "task.h" -#include "io.h" - -SUITE(task_tests); - -TEST task_test(void) { - TaskID parent_task_id = TaskID::from_random(); - FunctionID func_id = FunctionID::from_random(); - TaskBuilder *builder = make_task_builder(); - TaskSpec_start_construct(builder, DriverID::nil(), parent_task_id, 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, 2); - - UniqueID arg1 = UniqueID::from_random(); - TaskSpec_args_add_ref(builder, &arg1, 1); - TaskSpec_args_add_val(builder, (uint8_t *) "hello", 5); - UniqueID arg2 = UniqueID::from_random(); - TaskSpec_args_add_ref(builder, &arg2, 1); - TaskSpec_args_add_val(builder, (uint8_t *) "world", 5); - /* Finish constructing the spec. This constructs the task ID and the - * return IDs. */ - int64_t size; - TaskSpec *spec = TaskSpec_finish_construct(builder, &size); - - /* Check that the spec was constructed as expected. 
*/ - ASSERT(TaskSpec_num_args(spec) == 4); - ASSERT(TaskSpec_num_returns(spec) == 2); - ASSERT(FunctionID_equal(TaskSpec_function(spec), func_id)); - ASSERT(TaskSpec_arg_id(spec, 0, 0) == arg1); - ASSERT(memcmp(TaskSpec_arg_val(spec, 1), (uint8_t *) "hello", - TaskSpec_arg_length(spec, 1)) == 0); - ASSERT(TaskSpec_arg_id(spec, 2, 0) == arg2); - ASSERT(memcmp(TaskSpec_arg_val(spec, 3), (uint8_t *) "world", - TaskSpec_arg_length(spec, 3)) == 0); - - TaskSpec_free(spec); - free_task_builder(builder); - PASS(); -} - -TEST deterministic_ids_test(void) { - TaskBuilder *builder = make_task_builder(); - /* Define the inputs to the task construction. */ - TaskID parent_task_id = TaskID::from_random(); - FunctionID func_id = FunctionID::from_random(); - UniqueID arg1 = UniqueID::from_random(); - uint8_t *arg2 = (uint8_t *) "hello world"; - - /* Construct a first task. */ - TaskSpec_start_construct(builder, DriverID::nil(), parent_task_id, 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, 3); - TaskSpec_args_add_ref(builder, &arg1, 1); - TaskSpec_args_add_val(builder, arg2, 11); - int64_t size1; - TaskSpec *spec1 = TaskSpec_finish_construct(builder, &size1); - - /* Construct a second identical task. */ - TaskSpec_start_construct(builder, DriverID::nil(), parent_task_id, 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, 3); - TaskSpec_args_add_ref(builder, &arg1, 1); - TaskSpec_args_add_val(builder, arg2, 11); - int64_t size2; - TaskSpec *spec2 = TaskSpec_finish_construct(builder, &size2); - - /* Check that these tasks have the same task IDs and the same return IDs. */ - ASSERT(TaskID_equal(TaskSpec_task_id(spec1), TaskSpec_task_id(spec2))); - ASSERT(TaskSpec_return(spec1, 0) == TaskSpec_return(spec2, 0)); - ASSERT(TaskSpec_return(spec1, 1) == TaskSpec_return(spec2, 1)); - ASSERT(TaskSpec_return(spec1, 2) == TaskSpec_return(spec2, 2)); - /* Check that the return IDs are all distinct. */ - ASSERT(!(TaskSpec_return(spec1, 0) == TaskSpec_return(spec2, 1))); - ASSERT(!(TaskSpec_return(spec1, 0) == TaskSpec_return(spec2, 2))); - ASSERT(!(TaskSpec_return(spec1, 1) == TaskSpec_return(spec2, 2))); - - /* Create more tasks that are only mildly different. */ - - /* Construct a task with a different parent task ID. */ - TaskSpec_start_construct(builder, DriverID::nil(), TaskID::from_random(), 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, 3); - TaskSpec_args_add_ref(builder, &arg1, 1); - TaskSpec_args_add_val(builder, arg2, 11); - int64_t size3; - TaskSpec *spec3 = TaskSpec_finish_construct(builder, &size3); - - /* Construct a task with a different parent counter. */ - TaskSpec_start_construct(builder, DriverID::nil(), parent_task_id, 1, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, 3); - TaskSpec_args_add_ref(builder, &arg1, 1); - TaskSpec_args_add_val(builder, arg2, 11); - int64_t size4; - TaskSpec *spec4 = TaskSpec_finish_construct(builder, &size4); - - /* Construct a task with a different function ID. */ - TaskSpec_start_construct(builder, DriverID::nil(), parent_task_id, 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, FunctionID::from_random(), - 3); - TaskSpec_args_add_ref(builder, &arg1, 1); - TaskSpec_args_add_val(builder, arg2, 11); - int64_t size5; - TaskSpec *spec5 = TaskSpec_finish_construct(builder, &size5); - - /* Construct a task with a different object ID argument. 
*/ - TaskSpec_start_construct(builder, DriverID::nil(), parent_task_id, 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, 3); - ObjectID object_id = ObjectID::from_random(); - TaskSpec_args_add_ref(builder, &object_id, 1); - TaskSpec_args_add_val(builder, arg2, 11); - int64_t size6; - TaskSpec *spec6 = TaskSpec_finish_construct(builder, &size6); - - /* Construct a task with a different value argument. */ - TaskSpec_start_construct(builder, DriverID::nil(), parent_task_id, 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, 3); - TaskSpec_args_add_ref(builder, &arg1, 1); - TaskSpec_args_add_val(builder, (uint8_t *) "hello_world", 11); - int64_t size7; - TaskSpec *spec7 = TaskSpec_finish_construct(builder, &size7); - - /* Check that the task IDs are all distinct from the original. */ - ASSERT(!TaskID_equal(TaskSpec_task_id(spec1), TaskSpec_task_id(spec3))); - ASSERT(!TaskID_equal(TaskSpec_task_id(spec1), TaskSpec_task_id(spec4))); - ASSERT(!TaskID_equal(TaskSpec_task_id(spec1), TaskSpec_task_id(spec5))); - ASSERT(!TaskID_equal(TaskSpec_task_id(spec1), TaskSpec_task_id(spec6))); - ASSERT(!TaskID_equal(TaskSpec_task_id(spec1), TaskSpec_task_id(spec7))); - - /* Check that the return object IDs are distinct from the originals. */ - TaskSpec *specs[6] = {spec1, spec3, spec4, spec5, spec6, spec7}; - for (int task_index1 = 0; task_index1 < 6; ++task_index1) { - for (int return_index1 = 0; return_index1 < 3; ++return_index1) { - for (int task_index2 = 0; task_index2 < 6; ++task_index2) { - for (int return_index2 = 0; return_index2 < 3; ++return_index2) { - if (task_index1 != task_index2 && return_index1 != return_index2) { - ASSERT(!(TaskSpec_return(specs[task_index1], return_index1) == - TaskSpec_return(specs[task_index2], return_index2))); - } - } - } - } - } - - TaskSpec_free(spec1); - TaskSpec_free(spec2); - TaskSpec_free(spec3); - TaskSpec_free(spec4); - TaskSpec_free(spec5); - TaskSpec_free(spec6); - TaskSpec_free(spec7); - free_task_builder(builder); - PASS(); -} - -TEST send_task(void) { - TaskBuilder *builder = make_task_builder(); - TaskID parent_task_id = TaskID::from_random(); - FunctionID func_id = FunctionID::from_random(); - TaskSpec_start_construct(builder, DriverID::nil(), parent_task_id, 0, - ActorID::nil(), ObjectID::nil(), ActorID::nil(), - ActorID::nil(), 0, false, func_id, 2); - ObjectID object_id = ObjectID::from_random(); - TaskSpec_args_add_ref(builder, &object_id, 1); - TaskSpec_args_add_val(builder, (uint8_t *) "Hello", 5); - TaskSpec_args_add_val(builder, (uint8_t *) "World", 5); - object_id = ObjectID::from_random(); - TaskSpec_args_add_ref(builder, &object_id, 1); - int64_t size; - TaskSpec *spec = TaskSpec_finish_construct(builder, &size); - int fd[2]; - socketpair(AF_UNIX, SOCK_STREAM, 0, fd); - write_message(fd[0], static_cast(CommonMessageType::SUBMIT_TASK), - size, (uint8_t *) spec); - int64_t type; - int64_t length; - uint8_t *message; - read_message(fd[1], &type, &length, &message); - TaskSpec *result = (TaskSpec *) message; - ASSERT(static_cast(type) == - CommonMessageType::SUBMIT_TASK); - ASSERT(memcmp(spec, result, size) == 0); - TaskSpec_free(spec); - free(result); - free_task_builder(builder); - PASS(); -} - -SUITE(task_tests) { - RUN_TEST(task_test); - RUN_TEST(deterministic_ids_test); - RUN_TEST(send_task); -} - -GREATEST_MAIN_DEFS(); - -int main(int argc, char **argv) { - GREATEST_MAIN_BEGIN(); - RUN_SUITE(task_tests); - GREATEST_MAIN_END(); -} diff --git 
a/src/common/test/test_common.h b/src/common/test/test_common.h
deleted file mode 100644
index 03984e6f22490..0000000000000
--- a/src/common/test/test_common.h
+++ /dev/null
@@ -1,91 +0,0 @@
-#ifndef TEST_COMMON_H
-#define TEST_COMMON_H
-
-#include
-
-#include
-#include
-#include
-
-#include "common.h"
-#include "io.h"
-#include "hiredis/hiredis.h"
-#include "state/redis.h"
-
-#ifndef _WIN32
-/* This function is actually not declared in standard POSIX, so declare it. */
-extern int usleep(useconds_t usec);
-#endif
-
-/* I/O helper methods to retry binding to sockets. */
-static inline std::string bind_ipc_sock_retry(const char *socket_name_format,
-                                              int *fd) {
-  std::string socket_name;
-  for (int num_retries = 0; num_retries < 5; ++num_retries) {
-    RAY_LOG(INFO) << "trying to find plasma socket (attempt " << num_retries
-                  << ")";
-    size_t size = std::snprintf(nullptr, 0, socket_name_format, rand()) + 1;
-    char socket_name_c_str[size];
-    std::snprintf(socket_name_c_str, size, socket_name_format, rand());
-    socket_name = std::string(socket_name_c_str);
-
-    *fd = bind_ipc_sock(socket_name.c_str(), true);
-    if (*fd < 0) {
-      /* Sleep for 100ms. */
-      usleep(100000);
-      continue;
-    }
-    break;
-  }
-  return socket_name;
-}
-
-static inline int bind_inet_sock_retry(int *fd) {
-  int port = -1;
-  for (int num_retries = 0; num_retries < 5; ++num_retries) {
-    port = 10000 + rand() % 40000;
-    *fd = bind_inet_sock(port, true);
-    if (*fd < 0) {
-      /* Sleep for 100ms. */
-      usleep(100000);
-      continue;
-    }
-    break;
-  }
-  return port;
-}
-
-/* Flush redis. */
-static inline void flushall_redis(void) {
-  /* Flush the primary shard. */
-  redisContext *context = redisConnect("127.0.0.1", 6379);
-  std::vector<std::string> db_shards_addresses;
-  std::vector<int> db_shards_ports;
-  get_redis_shards(context, db_shards_addresses, db_shards_ports);
-  freeReplyObject(redisCommand(context, "FLUSHALL"));
-  /* Readd the shard locations. */
-  freeReplyObject(redisCommand(context, "SET NumRedisShards %d",
-                               db_shards_addresses.size()));
-  for (size_t i = 0; i < db_shards_addresses.size(); ++i) {
-    freeReplyObject(redisCommand(context, "RPUSH RedisShards %s:%d",
-                                 db_shards_addresses[i].c_str(),
-                                 db_shards_ports[i]));
-  }
-  redisFree(context);
-
-  /* Flush the remaining shards. */
-  for (size_t i = 0; i < db_shards_addresses.size(); ++i) {
-    context = redisConnect(db_shards_addresses[i].c_str(), db_shards_ports[i]);
-    freeReplyObject(redisCommand(context, "FLUSHALL"));
-    redisFree(context);
-  }
-}
-
-/* Cleanup method for running tests with the greatest library.
- * Runs the test, then clears the Redis database.
*/ -#define RUN_REDIS_TEST(test) \ - flushall_redis(); \ - RUN_TEST(test); \ - flushall_redis(); - -#endif /* TEST_COMMON */ diff --git a/src/common/thirdparty/download_thirdparty.bat b/src/common/thirdparty/download_thirdparty.bat deleted file mode 100644 index 988592f83af62..0000000000000 --- a/src/common/thirdparty/download_thirdparty.bat +++ /dev/null @@ -1,15 +0,0 @@ -@SetLocal - @Echo Off - @PushD "%~dp0" - git submodule update --init --jobs="%NUMBER_OF_PROCESSORS%" - @If Not Exist "python\.git" git clone "https://github.com/austinsc/python.git" - Call :GitApply "python" "%CD%/patches/windows/python-pyconfig.patch" - Call :GitApply "redis-windows" "%CD%/patches/windows/redis.patch" - @PopD -@EndLocal -@GoTo :EOF - -:GitApply - @REM Check if patch already applied by attempting to apply it in reverse; if not, then force-reapply it - git -C "%~1" apply "%~2" -R --check 2> NUL || git -C "%~1" apply "%~2" --3way 2> NUL || git -C "%~1" reset --hard && git -C "%~1" apply "%~2" --3way -@GoTo :EOF diff --git a/src/common/thirdparty/greatest.h b/src/common/thirdparty/greatest.h deleted file mode 100644 index eb34ff4263ece..0000000000000 --- a/src/common/thirdparty/greatest.h +++ /dev/null @@ -1,1023 +0,0 @@ -/* - * Copyright (c) 2011-2016 Scott Vokes - * - * Permission to use, copy, modify, and/or distribute this software for any - * purpose with or without fee is hereby granted, provided that the above - * copyright notice and this permission notice appear in all copies. - * - * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES - * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF - * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR - * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES - * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN - * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF - * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. - */ - -#ifndef GREATEST_H -#define GREATEST_H - -#ifdef __cplusplus -extern "C" { -#endif - -/* 1.2.1 */ -#define GREATEST_VERSION_MAJOR 1 -#define GREATEST_VERSION_MINOR 2 -#define GREATEST_VERSION_PATCH 1 - -/* A unit testing system for C, contained in 1 file. - * It doesn't use dynamic allocation or depend on anything - * beyond ANSI C89. - * - * An up-to-date version can be found at: - * https://github.com/silentbicycle/greatest/ - */ - - -/********************************************************************* - * Minimal test runner template - *********************************************************************/ -#if 0 -#include "greatest.h" -TEST foo_should_foo(void) { - PASS(); -} -static void setup_cb(void *data) { - printf("setup callback for each test case\n"); -} -static void teardown_cb(void *data) { - printf("teardown callback for each test case\n"); -} -SUITE(suite) { - /* Optional setup/teardown callbacks which will be run before/after - * every test case. If using a test suite, they will be cleared when - * the suite finishes. */ - SET_SETUP(setup_cb, voidp_to_callback_data); - SET_TEARDOWN(teardown_cb, voidp_to_callback_data); - RUN_TEST(foo_should_foo); -} -/* Add definitions that need to be in the test runner's main file. */ -GREATEST_MAIN_DEFS(); -/* Set up, run suite(s) of tests, report pass/fail/skip stats. */ -int run_tests(void) { - GREATEST_INIT(); /* init. greatest internals */ - /* List of suites to run (if any). 
*/ - RUN_SUITE(suite); - /* Tests can also be run directly, without using test suites. */ - RUN_TEST(foo_should_foo); - GREATEST_PRINT_REPORT(); /* display results */ - return greatest_all_passed(); -} -/* main(), for a standalone command-line test runner. - * This replaces run_tests above, and adds command line option - * handling and exiting with a pass/fail status. */ -int main(int argc, char **argv) { - GREATEST_MAIN_BEGIN(); /* init & parse command-line args */ - RUN_SUITE(suite); - GREATEST_MAIN_END(); /* display results */ -} -#endif -/*********************************************************************/ - - -#include -#include -#include -#include - -/*********** - * Options * - ***********/ - -/* Default column width for non-verbose output. */ -#ifndef GREATEST_DEFAULT_WIDTH -#define GREATEST_DEFAULT_WIDTH 72 -#endif - -/* FILE *, for test logging. */ -#ifndef GREATEST_STDOUT -#define GREATEST_STDOUT stdout -#endif - -/* Remove GREATEST_ prefix from most commonly used symbols? */ -#ifndef GREATEST_USE_ABBREVS -#define GREATEST_USE_ABBREVS 1 -#endif - -/* Set to 0 to disable all use of setjmp/longjmp. */ -#ifndef GREATEST_USE_LONGJMP -#define GREATEST_USE_LONGJMP 1 -#endif - -#if GREATEST_USE_LONGJMP -#include -#endif - -/* Set to 0 to disable all use of time.h / clock(). */ -#ifndef GREATEST_USE_TIME -#define GREATEST_USE_TIME 1 -#endif - -#if GREATEST_USE_TIME -#include -#endif - -/* Floating point type, for ASSERT_IN_RANGE. */ -#ifndef GREATEST_FLOAT -#define GREATEST_FLOAT double -#define GREATEST_FLOAT_FMT "%g" -#endif - -/********* - * Types * - *********/ - -/* Info for the current running suite. */ -typedef struct greatest_suite_info { - unsigned int tests_run; - unsigned int passed; - unsigned int failed; - unsigned int skipped; - -#if GREATEST_USE_TIME - /* timers, pre/post running suite and individual tests */ - clock_t pre_suite; - clock_t post_suite; - clock_t pre_test; - clock_t post_test; -#endif -} greatest_suite_info; - -/* Type for a suite function. */ -typedef void (greatest_suite_cb)(void); - -/* Types for setup/teardown callbacks. If non-NULL, these will be run - * and passed the pointer to their additional data. */ -typedef void (greatest_setup_cb)(void *udata); -typedef void (greatest_teardown_cb)(void *udata); - -/* Type for an equality comparison between two pointers of the same type. - * Should return non-0 if equal, otherwise 0. - * UDATA is a closure value, passed through from ASSERT_EQUAL_T[m]. */ -typedef int greatest_equal_cb(const void *exp, const void *got, void *udata); - -/* Type for a callback that prints a value pointed to by T. - * Return value has the same meaning as printf's. - * UDATA is a closure value, passed through from ASSERT_EQUAL_T[m]. */ -typedef int greatest_printf_cb(const void *t, void *udata); - -/* Callbacks for an arbitrary type; needed for type-specific - * comparisons via GREATEST_ASSERT_EQUAL_T[m].*/ -typedef struct greatest_type_info { - greatest_equal_cb *equal; - greatest_printf_cb *print; -} greatest_type_info; - -typedef struct greatest_memory_cmp_env { - const unsigned char *exp; - const unsigned char *got; - size_t size; -} greatest_memory_cmp_env; - -/* Callbacks for string and raw memory types. */ -extern greatest_type_info greatest_type_info_string; -extern greatest_type_info greatest_type_info_memory; - -typedef enum { - GREATEST_FLAG_FIRST_FAIL = 0x01, - GREATEST_FLAG_LIST_ONLY = 0x02 -} greatest_flag_t; - -/* Struct containing all test runner state. 
*/ -typedef struct greatest_run_info { - unsigned char flags; - unsigned char verbosity; - unsigned int tests_run; /* total test count */ - - /* overall pass/fail/skip counts */ - unsigned int passed; - unsigned int failed; - unsigned int skipped; - unsigned int assertions; - - /* currently running test suite */ - greatest_suite_info suite; - - /* info to print about the most recent failure */ - const char *fail_file; - unsigned int fail_line; - const char *msg; - - /* current setup/teardown hooks and userdata */ - greatest_setup_cb *setup; - void *setup_udata; - greatest_teardown_cb *teardown; - void *teardown_udata; - - /* formatting info for ".....s...F"-style output */ - unsigned int col; - unsigned int width; - - /* only run a specific suite or test */ - const char *suite_filter; - const char *test_filter; - -#if GREATEST_USE_TIME - /* overall timers */ - clock_t begin; - clock_t end; -#endif - -#if GREATEST_USE_LONGJMP - jmp_buf jump_dest; -#endif -} greatest_run_info; - -struct greatest_report_t { - /* overall pass/fail/skip counts */ - unsigned int passed; - unsigned int failed; - unsigned int skipped; - unsigned int assertions; -}; - -/* Global var for the current testing context. - * Initialized by GREATEST_MAIN_DEFS(). */ -extern greatest_run_info greatest_info; - -/* Type for ASSERT_ENUM_EQ's ENUM_STR argument. */ -typedef const char *greatest_enum_str_fun(int value); - -/********************** - * Exported functions * - **********************/ - -/* These are used internally by greatest. */ -void greatest_do_pass(const char *name); -void greatest_do_fail(const char *name); -void greatest_do_skip(const char *name); -int greatest_pre_test(const char *name); -void greatest_post_test(const char *name, int res); -void greatest_usage(const char *name); -int greatest_do_assert_equal_t(const void *exp, const void *got, - greatest_type_info *type_info, void *udata); - -/* These are part of the public greatest API. */ -void GREATEST_SET_SETUP_CB(greatest_setup_cb *cb, void *udata); -void GREATEST_SET_TEARDOWN_CB(greatest_teardown_cb *cb, void *udata); -int greatest_all_passed(void); -void greatest_set_test_filter(const char *name); -void greatest_set_suite_filter(const char *name); -void greatest_get_report(struct greatest_report_t *report); -unsigned int greatest_get_verbosity(void); -void greatest_set_verbosity(unsigned int verbosity); -void greatest_set_flag(greatest_flag_t flag); - - -/******************** -* Language Support * -********************/ - -/* If __VA_ARGS__ (C99) is supported, allow parametric testing -* without needing to manually manage the argument struct. */ -#if __STDC_VERSION__ >= 19901L || _MSC_VER >= 1800 -#define GREATEST_VA_ARGS -#endif - - -/********** - * Macros * - **********/ - -/* Define a suite. */ -#define GREATEST_SUITE(NAME) void NAME(void); void NAME(void) - -/* Declare a suite, provided by another compilation unit. */ -#define GREATEST_SUITE_EXTERN(NAME) void NAME(void) - -/* Start defining a test function. - * The arguments are not included, to allow parametric testing. */ -#define GREATEST_TEST static enum greatest_test_res - -/* PASS/FAIL/SKIP result from a test. Used internally. */ -typedef enum greatest_test_res { - GREATEST_TEST_RES_PASS = 0, - GREATEST_TEST_RES_FAIL = -1, - GREATEST_TEST_RES_SKIP = 1 -} greatest_test_res; - -/* Run a suite. */ -#define GREATEST_RUN_SUITE(S_NAME) greatest_run_suite(S_NAME, #S_NAME) - -/* Run a test in the current suite. 
*/ -#define GREATEST_RUN_TEST(TEST) \ - do { \ - if (greatest_pre_test(#TEST) == 1) { \ - enum greatest_test_res res = GREATEST_SAVE_CONTEXT(); \ - if (res == GREATEST_TEST_RES_PASS) { \ - res = TEST(); \ - } \ - greatest_post_test(#TEST, res); \ - } else if (GREATEST_LIST_ONLY()) { \ - fprintf(GREATEST_STDOUT, " %s\n", #TEST); \ - } \ - } while (0) - -/* Ignore a test, don't warn about it being unused. */ -#define GREATEST_IGNORE_TEST(TEST) (void)TEST - -/* Run a test in the current suite with one void * argument, - * which can be a pointer to a struct with multiple arguments. */ -#define GREATEST_RUN_TEST1(TEST, ENV) \ - do { \ - if (greatest_pre_test(#TEST) == 1) { \ - int res = TEST(ENV); \ - greatest_post_test(#TEST, res); \ - } else if (GREATEST_LIST_ONLY()) { \ - fprintf(GREATEST_STDOUT, " %s\n", #TEST); \ - } \ - } while (0) - -#ifdef GREATEST_VA_ARGS -#define GREATEST_RUN_TESTp(TEST, ...) \ - do { \ - if (greatest_pre_test(#TEST) == 1) { \ - int res = TEST(__VA_ARGS__); \ - greatest_post_test(#TEST, res); \ - } else if (GREATEST_LIST_ONLY()) { \ - fprintf(GREATEST_STDOUT, " %s\n", #TEST); \ - } \ - } while (0) -#endif - - -/* Check if the test runner is in verbose mode. */ -#define GREATEST_IS_VERBOSE() ((greatest_info.verbosity) > 0) -#define GREATEST_LIST_ONLY() \ - (greatest_info.flags & GREATEST_FLAG_LIST_ONLY) -#define GREATEST_FIRST_FAIL() \ - (greatest_info.flags & GREATEST_FLAG_FIRST_FAIL) -#define GREATEST_FAILURE_ABORT() \ - (greatest_info.suite.failed > 0 && GREATEST_FIRST_FAIL()) - -/* Message-less forms of tests defined below. */ -#define GREATEST_PASS() GREATEST_PASSm(NULL) -#define GREATEST_FAIL() GREATEST_FAILm(NULL) -#define GREATEST_SKIP() GREATEST_SKIPm(NULL) -#define GREATEST_ASSERT(COND) \ - GREATEST_ASSERTm(#COND, COND) -#define GREATEST_ASSERT_OR_LONGJMP(COND) \ - GREATEST_ASSERT_OR_LONGJMPm(#COND, COND) -#define GREATEST_ASSERT_FALSE(COND) \ - GREATEST_ASSERT_FALSEm(#COND, COND) -#define GREATEST_ASSERT_EQ(EXP, GOT) \ - GREATEST_ASSERT_EQm(#EXP " != " #GOT, EXP, GOT) -#define GREATEST_ASSERT_EQ_FMT(EXP, GOT, FMT) \ - GREATEST_ASSERT_EQ_FMTm(#EXP " != " #GOT, EXP, GOT, FMT) -#define GREATEST_ASSERT_IN_RANGE(EXP, GOT, TOL) \ - GREATEST_ASSERT_IN_RANGEm(#EXP " != " #GOT " +/- " #TOL, EXP, GOT, TOL) -#define GREATEST_ASSERT_EQUAL_T(EXP, GOT, TYPE_INFO, UDATA) \ - GREATEST_ASSERT_EQUAL_Tm(#EXP " != " #GOT, EXP, GOT, TYPE_INFO, UDATA) -#define GREATEST_ASSERT_STR_EQ(EXP, GOT) \ - GREATEST_ASSERT_STR_EQm(#EXP " != " #GOT, EXP, GOT) -#define GREATEST_ASSERT_STRN_EQ(EXP, GOT, SIZE) \ - GREATEST_ASSERT_STRN_EQm(#EXP " != " #GOT, EXP, GOT, SIZE) -#define GREATEST_ASSERT_MEM_EQ(EXP, GOT, SIZE) \ - GREATEST_ASSERT_MEM_EQm(#EXP " != " #GOT, EXP, GOT, SIZE) -#define GREATEST_ASSERT_ENUM_EQ(EXP, GOT, ENUM_STR) \ - GREATEST_ASSERT_ENUM_EQm(#EXP " != " #GOT, EXP, GOT, ENUM_STR) - -/* The following forms take an additional message argument first, - * to be displayed by the test runner. */ - -/* Fail if a condition is not true, with message. */ -#define GREATEST_ASSERTm(MSG, COND) \ - do { \ - greatest_info.assertions++; \ - if (!(COND)) { GREATEST_FAILm(MSG); } \ - } while (0) - -/* Fail if a condition is not true, longjmping out of test. */ -#define GREATEST_ASSERT_OR_LONGJMPm(MSG, COND) \ - do { \ - greatest_info.assertions++; \ - if (!(COND)) { GREATEST_FAIL_WITH_LONGJMPm(MSG); } \ - } while (0) - -/* Fail if a condition is not false, with message. 
*/ -#define GREATEST_ASSERT_FALSEm(MSG, COND) \ - do { \ - greatest_info.assertions++; \ - if ((COND)) { GREATEST_FAILm(MSG); } \ - } while (0) - -/* Fail if EXP != GOT (equality comparison by ==). */ -#define GREATEST_ASSERT_EQm(MSG, EXP, GOT) \ - do { \ - greatest_info.assertions++; \ - if ((EXP) != (GOT)) { GREATEST_FAILm(MSG); } \ - } while (0) - -/* Fail if EXP != GOT (equality comparison by ==). - * Warning: EXP and GOT will be evaluated more than once on failure. */ -#define GREATEST_ASSERT_EQ_FMTm(MSG, EXP, GOT, FMT) \ - do { \ - const char *greatest_FMT = ( FMT ); \ - greatest_info.assertions++; \ - if ((EXP) != (GOT)) { \ - fprintf(GREATEST_STDOUT, "\nExpected: "); \ - fprintf(GREATEST_STDOUT, greatest_FMT, EXP); \ - fprintf(GREATEST_STDOUT, "\n Got: "); \ - fprintf(GREATEST_STDOUT, greatest_FMT, GOT); \ - fprintf(GREATEST_STDOUT, "\n"); \ - GREATEST_FAILm(MSG); \ - } \ - } while (0) - -/* Fail if EXP is not equal to GOT, printing enum IDs. */ -#define GREATEST_ASSERT_ENUM_EQm(MSG, EXP, GOT, ENUM_STR) \ - do { \ - int greatest_EXP = (int)(EXP); \ - int greatest_GOT = (int)(GOT); \ - greatest_enum_str_fun *greatest_ENUM_STR = ENUM_STR; \ - if (greatest_EXP != greatest_GOT) { \ - fprintf(GREATEST_STDOUT, "\nExpected: %s", \ - greatest_ENUM_STR(greatest_EXP)); \ - fprintf(GREATEST_STDOUT, "\n Got: %s\n", \ - greatest_ENUM_STR(greatest_GOT)); \ - GREATEST_FAILm(MSG); \ - } \ - } while (0) \ - -/* Fail if GOT not in range of EXP +|- TOL. */ -#define GREATEST_ASSERT_IN_RANGEm(MSG, EXP, GOT, TOL) \ - do { \ - GREATEST_FLOAT greatest_EXP = (EXP); \ - GREATEST_FLOAT greatest_GOT = (GOT); \ - GREATEST_FLOAT greatest_TOL = (TOL); \ - greatest_info.assertions++; \ - if ((greatest_EXP > greatest_GOT && \ - greatest_EXP - greatest_GOT > greatest_TOL) || \ - (greatest_EXP < greatest_GOT && \ - greatest_GOT - greatest_EXP > greatest_TOL)) { \ - fprintf(GREATEST_STDOUT, \ - "\nExpected: " GREATEST_FLOAT_FMT \ - " +/- " GREATEST_FLOAT_FMT \ - "\n Got: " GREATEST_FLOAT_FMT \ - "\n", \ - greatest_EXP, greatest_TOL, greatest_GOT); \ - GREATEST_FAILm(MSG); \ - } \ - } while (0) - -/* Fail if EXP is not equal to GOT, according to strcmp. */ -#define GREATEST_ASSERT_STR_EQm(MSG, EXP, GOT) \ - do { \ - GREATEST_ASSERT_EQUAL_Tm(MSG, EXP, GOT, \ - &greatest_type_info_string, NULL); \ - } while (0) \ - -/* Fail if EXP is not equal to GOT, according to strcmp. */ -#define GREATEST_ASSERT_STRN_EQm(MSG, EXP, GOT, SIZE) \ - do { \ - size_t size = SIZE; \ - GREATEST_ASSERT_EQUAL_Tm(MSG, EXP, GOT, \ - &greatest_type_info_string, &size); \ - } while (0) \ - -/* Fail if EXP is not equal to GOT, according to memcmp. */ -#define GREATEST_ASSERT_MEM_EQm(MSG, EXP, GOT, SIZE) \ - do { \ - greatest_memory_cmp_env env; \ - env.exp = (const unsigned char *)EXP; \ - env.got = (const unsigned char *)GOT; \ - env.size = SIZE; \ - GREATEST_ASSERT_EQUAL_Tm(MSG, env.exp, env.got, \ - &greatest_type_info_memory, &env); \ - } while (0) \ - -/* Fail if EXP is not equal to GOT, according to a comparison - * callback in TYPE_INFO. If they are not equal, optionally use a - * print callback in TYPE_INFO to print them. */ -#define GREATEST_ASSERT_EQUAL_Tm(MSG, EXP, GOT, TYPE_INFO, UDATA) \ - do { \ - greatest_type_info *type_info = (TYPE_INFO); \ - greatest_info.assertions++; \ - if (!greatest_do_assert_equal_t(EXP, GOT, \ - type_info, UDATA)) { \ - if (type_info == NULL || type_info->equal == NULL) { \ - GREATEST_FAILm("type_info->equal callback missing!"); \ - } else { \ - GREATEST_FAILm(MSG); \ - } \ - } \ - } while (0) \ - -/* Pass. 
*/ -#define GREATEST_PASSm(MSG) \ - do { \ - greatest_info.msg = MSG; \ - return GREATEST_TEST_RES_PASS; \ - } while (0) - -/* Fail. */ -#define GREATEST_FAILm(MSG) \ - do { \ - greatest_info.fail_file = __FILE__; \ - greatest_info.fail_line = __LINE__; \ - greatest_info.msg = MSG; \ - return GREATEST_TEST_RES_FAIL; \ - } while (0) - -/* Optional GREATEST_FAILm variant that longjmps. */ -#if GREATEST_USE_LONGJMP -#define GREATEST_FAIL_WITH_LONGJMP() GREATEST_FAIL_WITH_LONGJMPm(NULL) -#define GREATEST_FAIL_WITH_LONGJMPm(MSG) \ - do { \ - greatest_info.fail_file = __FILE__; \ - greatest_info.fail_line = __LINE__; \ - greatest_info.msg = MSG; \ - longjmp(greatest_info.jump_dest, GREATEST_TEST_RES_FAIL); \ - } while (0) -#endif - -/* Skip the current test. */ -#define GREATEST_SKIPm(MSG) \ - do { \ - greatest_info.msg = MSG; \ - return GREATEST_TEST_RES_SKIP; \ - } while (0) - -/* Check the result of a subfunction using ASSERT, etc. */ -#define GREATEST_CHECK_CALL(RES) \ - do { \ - enum greatest_test_res greatest_RES = RES; \ - if (greatest_RES != GREATEST_TEST_RES_PASS) { \ - return greatest_RES; \ - } \ - } while (0) \ - -#if GREATEST_USE_TIME -#define GREATEST_SET_TIME(NAME) \ - NAME = clock(); \ - if (NAME == (clock_t) -1) { \ - fprintf(GREATEST_STDOUT, \ - "clock error: %s\n", #NAME); \ - exit(EXIT_FAILURE); \ - } - -#define GREATEST_CLOCK_DIFF(C1, C2) \ - fprintf(GREATEST_STDOUT, " (%lu ticks, %.3f sec)", \ - (long unsigned int) (C2) - (long unsigned int)(C1), \ - (double)((C2) - (C1)) / (1.0 * (double)CLOCKS_PER_SEC)) -#else -#define GREATEST_SET_TIME(UNUSED) -#define GREATEST_CLOCK_DIFF(UNUSED1, UNUSED2) -#endif - -#if GREATEST_USE_LONGJMP -#define GREATEST_SAVE_CONTEXT() \ - /* setjmp returns 0 (GREATEST_TEST_RES_PASS) on first call */ \ - /* so the test runs, then RES_FAIL from FAIL_WITH_LONGJMP. */ \ - ((enum greatest_test_res)(setjmp(greatest_info.jump_dest))) -#else -#define GREATEST_SAVE_CONTEXT() \ - /*a no-op, since setjmp/longjmp aren't being used */ \ - GREATEST_TEST_RES_PASS -#endif - -/* Include several function definitions in the main test file. */ -#define GREATEST_MAIN_DEFS() \ - \ -/* Is FILTER a subset of NAME? 
*/ \ -static int greatest_name_match(const char *name, \ - const char *filter) { \ - size_t offset = 0; \ - size_t filter_len = strlen(filter); \ - while (name[offset] != '\0') { \ - if (name[offset] == filter[0]) { \ - if (0 == strncmp(&name[offset], filter, filter_len)) { \ - return 1; \ - } \ - } \ - offset++; \ - } \ - \ - return 0; \ -} \ - \ -int greatest_pre_test(const char *name) { \ - if (!GREATEST_LIST_ONLY() \ - && (!GREATEST_FIRST_FAIL() || greatest_info.suite.failed == 0) \ - && (greatest_info.test_filter == NULL || \ - greatest_name_match(name, greatest_info.test_filter))) { \ - GREATEST_SET_TIME(greatest_info.suite.pre_test); \ - if (greatest_info.setup) { \ - greatest_info.setup(greatest_info.setup_udata); \ - } \ - return 1; /* test should be run */ \ - } else { \ - return 0; /* skipped */ \ - } \ -} \ - \ -void greatest_post_test(const char *name, int res) { \ - GREATEST_SET_TIME(greatest_info.suite.post_test); \ - if (greatest_info.teardown) { \ - void *udata = greatest_info.teardown_udata; \ - greatest_info.teardown(udata); \ - } \ - \ - if (res <= GREATEST_TEST_RES_FAIL) { \ - greatest_do_fail(name); \ - } else if (res >= GREATEST_TEST_RES_SKIP) { \ - greatest_do_skip(name); \ - } else if (res == GREATEST_TEST_RES_PASS) { \ - greatest_do_pass(name); \ - } \ - greatest_info.suite.tests_run++; \ - greatest_info.col++; \ - if (GREATEST_IS_VERBOSE()) { \ - GREATEST_CLOCK_DIFF(greatest_info.suite.pre_test, \ - greatest_info.suite.post_test); \ - fprintf(GREATEST_STDOUT, "\n"); \ - } else if (greatest_info.col % greatest_info.width == 0) { \ - fprintf(GREATEST_STDOUT, "\n"); \ - greatest_info.col = 0; \ - } \ - if (GREATEST_STDOUT == stdout) fflush(stdout); \ -} \ - \ -static void report_suite(void) { \ - if (greatest_info.suite.tests_run > 0) { \ - fprintf(GREATEST_STDOUT, \ - "\n%u test%s - %u passed, %u failed, %u skipped", \ - greatest_info.suite.tests_run, \ - greatest_info.suite.tests_run == 1 ? "" : "s", \ - greatest_info.suite.passed, \ - greatest_info.suite.failed, \ - greatest_info.suite.skipped); \ - GREATEST_CLOCK_DIFF(greatest_info.suite.pre_suite, \ - greatest_info.suite.post_suite); \ - fprintf(GREATEST_STDOUT, "\n"); \ - } \ -} \ - \ -static void update_counts_and_reset_suite(void) { \ - greatest_info.setup = NULL; \ - greatest_info.setup_udata = NULL; \ - greatest_info.teardown = NULL; \ - greatest_info.teardown_udata = NULL; \ - greatest_info.passed += greatest_info.suite.passed; \ - greatest_info.failed += greatest_info.suite.failed; \ - greatest_info.skipped += greatest_info.suite.skipped; \ - greatest_info.tests_run += greatest_info.suite.tests_run; \ - memset(&greatest_info.suite, 0, sizeof(greatest_info.suite)); \ - greatest_info.col = 0; \ -} \ - \ -static void greatest_run_suite(greatest_suite_cb *suite_cb, \ - const char *suite_name) { \ - if (greatest_info.suite_filter && \ - !greatest_name_match(suite_name, greatest_info.suite_filter)) { \ - return; \ - } \ - update_counts_and_reset_suite(); \ - if (GREATEST_FIRST_FAIL() && greatest_info.failed > 0) { return; } \ - fprintf(GREATEST_STDOUT, "\n* Suite %s:\n", suite_name); \ - GREATEST_SET_TIME(greatest_info.suite.pre_suite); \ - suite_cb(); \ - GREATEST_SET_TIME(greatest_info.suite.post_suite); \ - report_suite(); \ -} \ - \ -void greatest_do_pass(const char *name) { \ - if (GREATEST_IS_VERBOSE()) { \ - fprintf(GREATEST_STDOUT, "PASS %s: %s", \ - name, greatest_info.msg ? 
greatest_info.msg : ""); \ - } else { \ - fprintf(GREATEST_STDOUT, "."); \ - } \ - greatest_info.suite.passed++; \ -} \ - \ -void greatest_do_fail(const char *name) { \ - if (GREATEST_IS_VERBOSE()) { \ - fprintf(GREATEST_STDOUT, \ - "FAIL %s: %s (%s:%u)", \ - name, greatest_info.msg ? greatest_info.msg : "", \ - greatest_info.fail_file, greatest_info.fail_line); \ - } else { \ - fprintf(GREATEST_STDOUT, "F"); \ - greatest_info.col++; \ - /* add linebreak if in line of '.'s */ \ - if (greatest_info.col != 0) { \ - fprintf(GREATEST_STDOUT, "\n"); \ - greatest_info.col = 0; \ - } \ - fprintf(GREATEST_STDOUT, "FAIL %s: %s (%s:%u)\n", \ - name, \ - greatest_info.msg ? greatest_info.msg : "", \ - greatest_info.fail_file, greatest_info.fail_line); \ - } \ - greatest_info.suite.failed++; \ -} \ - \ -void greatest_do_skip(const char *name) { \ - if (GREATEST_IS_VERBOSE()) { \ - fprintf(GREATEST_STDOUT, "SKIP %s: %s", \ - name, \ - greatest_info.msg ? \ - greatest_info.msg : "" ); \ - } else { \ - fprintf(GREATEST_STDOUT, "s"); \ - } \ - greatest_info.suite.skipped++; \ -} \ - \ -int greatest_do_assert_equal_t(const void *exp, const void *got, \ - greatest_type_info *type_info, void *udata) { \ - int eq = 0; \ - if (type_info == NULL || type_info->equal == NULL) { \ - return 0; \ - } \ - eq = type_info->equal(exp, got, udata); \ - if (!eq) { \ - if (type_info->print != NULL) { \ - fprintf(GREATEST_STDOUT, "\nExpected: "); \ - (void)type_info->print(exp, udata); \ - fprintf(GREATEST_STDOUT, "\n Got: "); \ - (void)type_info->print(got, udata); \ - fprintf(GREATEST_STDOUT, "\n"); \ - } else { \ - fprintf(GREATEST_STDOUT, \ - "GREATEST_ASSERT_EQUAL_T failure at %s:%u\n", \ - greatest_info.fail_file, \ - greatest_info.fail_line); \ - } \ - } \ - return eq; \ -} \ - \ -void greatest_usage(const char *name) { \ - fprintf(GREATEST_STDOUT, \ - "Usage: %s [-hlfv] [-s SUITE] [-t TEST]\n" \ - " -h, --help print this Help\n" \ - " -l List suites and their tests, then exit\n" \ - " -f Stop runner after first failure\n" \ - " -v Verbose output\n" \ - " -s SUITE only run suites containing string SUITE\n" \ - " -t TEST only run tests containing string TEST\n", \ - name); \ -} \ - \ -static void greatest_parse_args(int argc, char **argv) { \ - int i = 0; \ - for (i = 1; i < argc; i++) { \ - if (0 == strncmp("-t", argv[i], 2)) { \ - if (argc <= i + 1) { \ - greatest_usage(argv[0]); \ - exit(EXIT_FAILURE); \ - } \ - greatest_info.test_filter = argv[i+1]; \ - i++; \ - } else if (0 == strncmp("-s", argv[i], 2)) { \ - if (argc <= i + 1) { \ - greatest_usage(argv[0]); \ - exit(EXIT_FAILURE); \ - } \ - greatest_info.suite_filter = argv[i+1]; \ - i++; \ - } else if (0 == strncmp("-f", argv[i], 2)) { \ - greatest_info.flags |= GREATEST_FLAG_FIRST_FAIL; \ - } else if (0 == strncmp("-v", argv[i], 2)) { \ - greatest_info.verbosity++; \ - } else if (0 == strncmp("-l", argv[i], 2)) { \ - greatest_info.flags |= GREATEST_FLAG_LIST_ONLY; \ - } else if (0 == strncmp("-h", argv[i], 2) || \ - 0 == strncmp("--help", argv[i], 6)) { \ - greatest_usage(argv[0]); \ - exit(EXIT_SUCCESS); \ - } else if (0 == strncmp("--", argv[i], 2)) { \ - break; \ - } else { \ - fprintf(GREATEST_STDOUT, \ - "Unknown argument '%s'\n", argv[i]); \ - greatest_usage(argv[0]); \ - exit(EXIT_FAILURE); \ - } \ - } \ -} \ - \ -int greatest_all_passed(void) { return (greatest_info.failed == 0); } \ - \ -void greatest_set_test_filter(const char *name) { \ - greatest_info.test_filter = name; \ -} \ - \ -void greatest_set_suite_filter(const char *name) { \ - 
greatest_info.suite_filter = name; \ -} \ - \ -void greatest_get_report(struct greatest_report_t *report) { \ - if (report) { \ - report->passed = greatest_info.passed; \ - report->failed = greatest_info.failed; \ - report->skipped = greatest_info.skipped; \ - report->assertions = greatest_info.assertions; \ - } \ -} \ - \ -unsigned int greatest_get_verbosity(void) { \ - return greatest_info.verbosity; \ -} \ - \ -void greatest_set_verbosity(unsigned int verbosity) { \ - greatest_info.verbosity = (unsigned char)verbosity; \ -} \ - \ -void greatest_set_flag(greatest_flag_t flag) { \ - greatest_info.flags |= flag; \ -} \ - \ -void GREATEST_SET_SETUP_CB(greatest_setup_cb *cb, void *udata) { \ - greatest_info.setup = cb; \ - greatest_info.setup_udata = udata; \ -} \ - \ -void GREATEST_SET_TEARDOWN_CB(greatest_teardown_cb *cb, \ - void *udata) { \ - greatest_info.teardown = cb; \ - greatest_info.teardown_udata = udata; \ -} \ - \ -static int greatest_string_equal_cb(const void *exp, const void *got, \ - void *udata) { \ - size_t *size = (size_t *)udata; \ - return (size != NULL \ - ? (0 == strncmp((const char *)exp, (const char *)got, *size)) \ - : (0 == strcmp((const char *)exp, (const char *)got))); \ -} \ - \ -static int greatest_string_printf_cb(const void *t, void *udata) { \ - (void)udata; /* note: does not check \0 termination. */ \ - return fprintf(GREATEST_STDOUT, "%s", (const char *)t); \ -} \ - \ -greatest_type_info greatest_type_info_string = { \ - greatest_string_equal_cb, \ - greatest_string_printf_cb, \ -}; \ - \ -static int greatest_memory_equal_cb(const void *exp, const void *got, \ - void *udata) { \ - greatest_memory_cmp_env *env = (greatest_memory_cmp_env *)udata; \ - return (0 == memcmp(exp, got, env->size)); \ -} \ - \ -static int greatest_memory_printf_cb(const void *t, void *udata) { \ - greatest_memory_cmp_env *env = (greatest_memory_cmp_env *)udata; \ - unsigned char *buf = (unsigned char *)t, diff_mark = ' '; \ - FILE *out = GREATEST_STDOUT; \ - size_t i, line_i, line_len = 0; \ - int len = 0; /* format hexdump with differences highlighted */ \ - for (i = 0; i < env->size; i+= line_len) { \ - diff_mark = ' '; \ - line_len = env->size - i; \ - if (line_len > 16) { line_len = 16; } \ - for (line_i = i; line_i < i + line_len; line_i++) { \ - if (env->exp[line_i] != env->got[line_i]) diff_mark = 'X'; \ - } \ - len += fprintf(out, "\n%04x %c ", (unsigned int)i, diff_mark); \ - for (line_i = i; line_i < i + line_len; line_i++) { \ - int m = env->exp[line_i] == env->got[line_i]; /* match? */ \ - len += fprintf(out, "%02x%c", buf[line_i], m ? ' ' : '<'); \ - } \ - for (line_i = 0; line_i < 16 - line_len; line_i++) { \ - len += fprintf(out, " "); \ - } \ - fprintf(out, " "); \ - for (line_i = i; line_i < i + line_len; line_i++) { \ - unsigned char c = buf[line_i]; \ - len += fprintf(out, "%c", isprint(c) ? c : '.'); \ - } \ - } \ - len += fprintf(out, "\n"); \ - return len; \ -} \ - \ -greatest_type_info greatest_type_info_memory = { \ - greatest_memory_equal_cb, \ - greatest_memory_printf_cb, \ -}; \ - \ -greatest_run_info greatest_info - -/* Init internals. */ -#define GREATEST_INIT() \ - do { \ - /* Suppress unused function warning if features aren't used */ \ - (void)greatest_run_suite; \ - (void)greatest_parse_args; \ - \ - memset(&greatest_info, 0, sizeof(greatest_info)); \ - greatest_info.width = GREATEST_DEFAULT_WIDTH; \ - GREATEST_SET_TIME(greatest_info.begin); \ - } while (0) \ - -/* Handle command-line arguments, etc. 
*/ -#define GREATEST_MAIN_BEGIN() \ - do { \ - GREATEST_INIT(); \ - greatest_parse_args(argc, argv); \ - } while (0) - -/* Report passes, failures, skipped tests, the number of - * assertions, and the overall run time. */ -#define GREATEST_PRINT_REPORT() \ - do { \ - if (!GREATEST_LIST_ONLY()) { \ - update_counts_and_reset_suite(); \ - GREATEST_SET_TIME(greatest_info.end); \ - fprintf(GREATEST_STDOUT, \ - "\nTotal: %u test%s", \ - greatest_info.tests_run, \ - greatest_info.tests_run == 1 ? "" : "s"); \ - GREATEST_CLOCK_DIFF(greatest_info.begin, \ - greatest_info.end); \ - fprintf(GREATEST_STDOUT, ", %u assertion%s\n", \ - greatest_info.assertions, \ - greatest_info.assertions == 1 ? "" : "s"); \ - fprintf(GREATEST_STDOUT, \ - "Pass: %u, fail: %u, skip: %u.\n", \ - greatest_info.passed, \ - greatest_info.failed, greatest_info.skipped); \ - } \ - } while (0) - -/* Report results, exit with exit status based on results. */ -#define GREATEST_MAIN_END() \ - do { \ - GREATEST_PRINT_REPORT(); \ - return (greatest_all_passed() ? EXIT_SUCCESS : EXIT_FAILURE); \ - } while (0) - -/* Make abbreviations without the GREATEST_ prefix for the - * most commonly used symbols. */ -#if GREATEST_USE_ABBREVS -#define TEST GREATEST_TEST -#define SUITE GREATEST_SUITE -#define SUITE_EXTERN GREATEST_SUITE_EXTERN -#define RUN_TEST GREATEST_RUN_TEST -#define RUN_TEST1 GREATEST_RUN_TEST1 -#define RUN_SUITE GREATEST_RUN_SUITE -#define IGNORE_TEST GREATEST_IGNORE_TEST -#define ASSERT GREATEST_ASSERT -#define ASSERTm GREATEST_ASSERTm -#define ASSERT_FALSE GREATEST_ASSERT_FALSE -#define ASSERT_EQ GREATEST_ASSERT_EQ -#define ASSERT_EQ_FMT GREATEST_ASSERT_EQ_FMT -#define ASSERT_IN_RANGE GREATEST_ASSERT_IN_RANGE -#define ASSERT_EQUAL_T GREATEST_ASSERT_EQUAL_T -#define ASSERT_STR_EQ GREATEST_ASSERT_STR_EQ -#define ASSERT_STRN_EQ GREATEST_ASSERT_STRN_EQ -#define ASSERT_MEM_EQ GREATEST_ASSERT_MEM_EQ -#define ASSERT_ENUM_EQ GREATEST_ASSERT_ENUM_EQ -#define ASSERT_FALSEm GREATEST_ASSERT_FALSEm -#define ASSERT_EQm GREATEST_ASSERT_EQm -#define ASSERT_EQ_FMTm GREATEST_ASSERT_EQ_FMTm -#define ASSERT_IN_RANGEm GREATEST_ASSERT_IN_RANGEm -#define ASSERT_EQUAL_Tm GREATEST_ASSERT_EQUAL_Tm -#define ASSERT_STR_EQm GREATEST_ASSERT_STR_EQm -#define ASSERT_STRN_EQm GREATEST_ASSERT_STRN_EQm -#define ASSERT_MEM_EQm GREATEST_ASSERT_MEM_EQm -#define ASSERT_ENUM_EQm GREATEST_ASSERT_ENUM_EQm -#define PASS GREATEST_PASS -#define FAIL GREATEST_FAIL -#define SKIP GREATEST_SKIP -#define PASSm GREATEST_PASSm -#define FAILm GREATEST_FAILm -#define SKIPm GREATEST_SKIPm -#define SET_SETUP GREATEST_SET_SETUP_CB -#define SET_TEARDOWN GREATEST_SET_TEARDOWN_CB -#define CHECK_CALL GREATEST_CHECK_CALL - -#ifdef GREATEST_VA_ARGS -#define RUN_TESTp GREATEST_RUN_TESTp -#endif - -#if GREATEST_USE_LONGJMP -#define ASSERT_OR_LONGJMP GREATEST_ASSERT_OR_LONGJMP -#define ASSERT_OR_LONGJMPm GREATEST_ASSERT_OR_LONGJMPm -#define FAIL_WITH_LONGJMP GREATEST_FAIL_WITH_LONGJMP -#define FAIL_WITH_LONGJMPm GREATEST_FAIL_WITH_LONGJMPm -#endif - -#endif /* USE_ABBREVS */ - -#ifdef __cplusplus -} -#endif - -#endif diff --git a/src/common/thirdparty/patches/.gitattributes b/src/common/thirdparty/patches/.gitattributes deleted file mode 100644 index 9812ceb1ffd9b..0000000000000 --- a/src/common/thirdparty/patches/.gitattributes +++ /dev/null @@ -1 +0,0 @@ -*.patch text eol=lf diff --git a/src/common/thirdparty/patches/windows/python-pyconfig.patch b/src/common/thirdparty/patches/windows/python-pyconfig.patch deleted file mode 100644 index 4280dee774702..0000000000000 --- 
a/src/common/thirdparty/patches/windows/python-pyconfig.patch +++ /dev/null @@ -1,25 +0,0 @@ -diff --git a/inc/Windows/pyconfig.h b/inc/Windows/pyconfig.h -index 1cfc59b..d4861cb ---- a/inc/Windows/pyconfig.h -+++ b/inc/Windows/pyconfig.h -@@ -1,6 +1,11 @@ - #ifndef Py_CONFIG_H - #define Py_CONFIG_H - -+#ifdef _MSC_VER -+#pragma push_macro("_DEBUG") -+#undef _DEBUG -+#endif -+ - /* pyconfig.h. NOT Generated automatically by configure. - - This is a manually maintained version used for the Watcom, -@@ -756,4 +761,8 @@ Py_NO_ENABLE_SHARED to find out. Also support MS_NO_COREDLL for b/w compat */ - least significant byte first */ - #define DOUBLE_IS_LITTLE_ENDIAN_IEEE754 1 - -+#ifdef _MSC_VER -+#pragma pop_macro("_DEBUG") -+#endif -+ - #endif /* !Py_CONFIG_H */ diff --git a/src/common/thirdparty/patches/windows/redis.patch b/src/common/thirdparty/patches/windows/redis.patch deleted file mode 100644 index 5ed2df5105cf3..0000000000000 --- a/src/common/thirdparty/patches/windows/redis.patch +++ /dev/null @@ -1,772 +0,0 @@ -diff --git a/msvs/RedisServer.vcxproj b/msvs/RedisServer.vcxproj -index 115ce90..68afb44 ---- a/msvs/RedisServer.vcxproj -+++ b/msvs/RedisServer.vcxproj -@@ -24,26 +24,26 @@ - - - -- Application -+ StaticLibrary - true -- v120 -+ v140_xp - false - - -- Application -+ StaticLibrary - true -- v120 -+ v140_xp - false - - -- Application -+ StaticLibrary - false -- v120 -+ v140_xp - - -- Application -+ StaticLibrary - false -- v120 -+ v140_xp - - - -@@ -61,41 +61,23 @@ - - - -- -+ - false - redis-server - false -- -- -- false -- redis-server -- false -- $(SolutionDir)$(Platform)\$(Configuration)\ -- $(Platform)\$(Configuration)\ -- -- -- false -- redis-server -- false -- Build -- -- -- false -- redis-server -- false -- $(SolutionDir)$(Platform)\$(Configuration)\ -- $(Platform)\$(Configuration)\ -+ $(SolutionDir)build\$(Platform)\$(Configuration)\ -+ $(SolutionDir)build\$(Platform)\$(Configuration)\$(MSBuildProjectName)\ - - - -- USE_JEMALLOC;_OFF_T_DEFINED;WIN32;LACKS_STDLIB_H;_DEBUG;_CONSOLE;__x86_64__;%(PreprocessorDefinitions) -- $(SolutionDir)..\deps\lua\src;$(SolutionDir)..\deps\hiredis;$(SolutionDir)..\deps\jemalloc-win\include -- MultiThreadedDebug -+ _WIN32_WINNT=0x0502;_OFF_T_DEFINED;WIN32;LACKS_STDLIB_H;_DEBUG;_CONSOLE;__x86_64__;%(PreprocessorDefinitions) -+ $(ProjectDir)..\deps\lua\src;$(ProjectDir)..\deps\hiredis;$(ProjectDir)..\deps\jemalloc-win\include - Level3 - ProgramDatabase - Disabled - 4996;4146 -- true -+ false -+ true - - - true -@@ -109,14 +91,14 @@ - - - -- USE_JEMALLOC;_OFF_T_DEFINED;WIN32;LACKS_STDLIB_H;_DEBUG;_CONSOLE;__x86_64__;%(PreprocessorDefinitions);_WIN32_WINNT=0x0501 -- $(SolutionDir)..\deps\lua\src;$(SolutionDir)..\deps\hiredis;$(SolutionDir)..\deps\jemalloc-win\include -- MultiThreadedDebug -+ _WIN32_WINNT=0x0502;_OFF_T_DEFINED;WIN32;LACKS_STDLIB_H;_DEBUG;_CONSOLE;__x86_64__;%(PreprocessorDefinitions);_WIN32_WINNT=0x0501 -+ $(ProjectDir)..\deps\lua\src;$(ProjectDir)..\deps\hiredis;$(ProjectDir)..\deps\jemalloc-win\include - Level3 - ProgramDatabase - Disabled - 4996;4146 -- true -+ false -+ true - - - true -@@ -130,14 +112,13 @@ - - - -- USE_JEMALLOC;_OFF_T_DEFINED;WIN32;LACKS_STDLIB_H;NDEBUG;_CONSOLE;__x86_64__;%(PreprocessorDefinitions) -- $(SolutionDir)..\deps\lua\src;$(SolutionDir)..\deps\hiredis;$(SolutionDir)..\deps\jemalloc-win\include -- MultiThreaded -+ _WIN32_WINNT=0x0502;_OFF_T_DEFINED;WIN32;LACKS_STDLIB_H;NDEBUG;_CONSOLE;__x86_64__;%(PreprocessorDefinitions) -+ 
$(ProjectDir)..\deps\lua\src;$(ProjectDir)..\deps\hiredis;$(ProjectDir)..\deps\jemalloc-win\include - Level3 - ProgramDatabase - 4996;4146 -- true - Full -+ true - - - true -@@ -162,13 +143,12 @@ - - - -- USE_JEMALLOC;_OFF_T_DEFINED;_WIN32;LACKS_STDLIB_H;NDEBUG;_CONSOLE;__x86_64__;%(PreprocessorDefinitions);_WIN32_WINNT=0x0501 -- $(SolutionDir)..\deps\lua\src;$(SolutionDir)..\deps\hiredis;$(SolutionDir)..\deps\jemalloc-win\include -- MultiThreaded -+ _WIN32_WINNT=0x0502;_OFF_T_DEFINED;_WIN32;LACKS_STDLIB_H;NDEBUG;_CONSOLE;__x86_64__;%(PreprocessorDefinitions);_WIN32_WINNT=0x0501 -+ $(ProjectDir)..\deps\lua\src;$(ProjectDir)..\deps\hiredis;$(ProjectDir)..\deps\jemalloc-win\include - Level3 - ProgramDatabase - 4996;4146 -- true -+ true - - - true -@@ -271,9 +251,6 @@ - - - -- -- {8b897e33-6428-4254-8335-4911d179bad1} -- - - {8c07f811-c81c-432c-b334-1ae6faecf951} - -diff --git a/msvs/hiredis/hiredis.vcxproj b/msvs/hiredis/hiredis.vcxproj -index 0622958..efaedae ---- a/msvs/hiredis/hiredis.vcxproj -+++ b/msvs/hiredis/hiredis.vcxproj -@@ -28,27 +28,25 @@ - StaticLibrary - true - MultiByte -- v120 -+ v140_xp - - - StaticLibrary - true - MultiByte -- v120 -+ v140_xp - - - StaticLibrary - false -- true - MultiByte -- v120 -+ v140_xp - - - StaticLibrary - false -- true - MultiByte -- v120 -+ v140_xp - - - -@@ -66,30 +64,20 @@ - - - -- -+ - hiredis -- -- -- hiredis -- $(SolutionDir)$(Platform)\$(Configuration)\ -- $(Platform)\$(Configuration)\ -- -- -- hiredis -- -- -- hiredis -- $(SolutionDir)$(Platform)\$(Configuration)\ -- $(Platform)\$(Configuration)\ -+ $(ProjectDir)..\$(Platform)\$(Configuration)\ -+ $(SolutionDir)build\$(Platform)\$(Configuration)\$(MSBuildProjectName)\ - - - - NotUsing - Level3 - Disabled -- _OFF_T_DEFINED;WIN32;_LIB;_DEBUG;%(PreprocessorDefinitions) -- MultiThreadedDebug -+ _WIN32_WINNT=0x0502;_OFF_T_DEFINED;WIN32;_LIB;_DEBUG;%(PreprocessorDefinitions) - 4996 -+ false -+ true - - - Windows -@@ -101,9 +89,10 @@ - NotUsing - Level3 - Disabled -- _OFF_T_DEFINED;WIN32;_LIB;_DEBUG;%(PreprocessorDefinitions) -- MultiThreadedDebug -+ _WIN32_WINNT=0x0502;_OFF_T_DEFINED;WIN32;_LIB;_DEBUG;%(PreprocessorDefinitions) - 4996 -+ false -+ true - - - Windows -@@ -117,10 +106,9 @@ - Full - true - true -- _OFF_T_DEFINED;WIN32;_LIB;%(PreprocessorDefinitions) -- MultiThreaded -+ _WIN32_WINNT=0x0502;_OFF_T_DEFINED;WIN32;_LIB;%(PreprocessorDefinitions) - 4996 -- true -+ true - - - Windows -@@ -136,10 +124,9 @@ - Full - true - true -- _OFF_T_DEFINED;WIN32;_LIB;%(PreprocessorDefinitions) -- MultiThreaded -+ _WIN32_WINNT=0x0502;_OFF_T_DEFINED;WIN32;_LIB;%(PreprocessorDefinitions) - 4996 -- true -+ true - - - Windows -diff --git a/msvs/lua/lua/lua.vcxproj b/msvs/lua/lua/lua.vcxproj -index b187130..adef07b ---- a/msvs/lua/lua/lua.vcxproj -+++ b/msvs/lua/lua/lua.vcxproj -@@ -30,28 +30,28 @@ - true - false - MultiByte -- v120 -+ v140_xp - - - StaticLibrary - true - false - MultiByte -- v120 -+ v140_xp - - - StaticLibrary - false - false - MultiByte -- v120 -+ v140_xp - - - StaticLibrary - false - false - MultiByte -- v120 -+ v140_xp - - - -@@ -69,25 +69,16 @@ - - - -- -+ - true -- .lib -- -- -- true -- .lib -- $(SolutionDir)$(Platform)\$(Configuration)\ -- $(Platform)\$(Configuration)\ - -- -+ - false -- .lib - -- -- false -+ - .lib -- $(SolutionDir)$(Platform)\$(Configuration)\ -- $(Platform)\$(Configuration)\ -+ $(SolutionDir)build\$(Platform)\$(Configuration)\ -+ $(SolutionDir)build\$(Platform)\$(Configuration)\$(MSBuildProjectName)\ - - - -@@ -95,8 +86,9 @@ - Disabled - 
_OFF_T_DEFINED;WIN32;_DEBUG;_LIB;_CRT_SECURE_NO_WARNINGS;%(PreprocessorDefinitions);LUA_ANSI;ENABLE_CJSON_GLOBAL - NotUsing -- MultiThreadedDebug - 4244;4018 -+ false -+ true - - - true -@@ -110,8 +102,9 @@ - Disabled - _OFF_T_DEFINED;WIN32;_DEBUG;_LIB;_CRT_SECURE_NO_WARNINGS;%(PreprocessorDefinitions);_WIN32_WINNT=0x0501;LUA_ANSI;ENABLE_CJSON_GLOBAL - NotUsing -- MultiThreadedDebug - 4244;4018 -+ false -+ true - - - true -@@ -124,10 +117,10 @@ - Level3 - _OFF_T_DEFINED;WIN32;NDEBUG;_LIB;_CRT_SECURE_NO_WARNINGS;%(PreprocessorDefinitions);LUA_ANSI;ENABLE_CJSON_GLOBAL - NotUsing -- MultiThreaded - 4244;4018 - Full - true -+ true - - - true -@@ -140,8 +133,8 @@ - Level3 - _OFF_T_DEFINED;WIN32;NDEBUG;_LIB;_CRT_SECURE_NO_WARNINGS;%(PreprocessorDefinitions);_WIN32_WINNT=0x0501;LUA_ANSI;ENABLE_CJSON_GLOBAL - NotUsing -- MultiThreaded - 4244;4018 -+ true - - - true -diff --git a/src/Win32_Interop/Win32_ANSI.c b/src/Win32_Interop/Win32_ANSI.c -index 404b84f..e7c55d2 ---- a/src/Win32_Interop/Win32_ANSI.c -+++ b/src/Win32_Interop/Win32_ANSI.c -@@ -737,7 +737,7 @@ void ANSI_printf(char *format, ...) { - memset(buffer, 0, cBufLen); - - va_start(args, format); -- retVal = vsprintf_s(buffer, cBufLen, format, args); -+ retVal = vsnprintf(buffer, cBufLen - 1, format, args); - va_end(args); - - if (retVal > 0) { -diff --git a/src/Win32_Interop/Win32_EventLog.cpp b/src/Win32_Interop/Win32_EventLog.cpp -index 1856540..3db4ddd ---- a/src/Win32_Interop/Win32_EventLog.cpp -+++ b/src/Win32_Interop/Win32_EventLog.cpp -@@ -30,7 +30,6 @@ using namespace std; - - #include "Win32_EventLog.h" - #include "Win32_SmartHandle.h" --#include "EventLog.h" - - static bool eventLogEnabled = true; - static string eventLogIdentity = "redis"; -@@ -129,17 +128,17 @@ void RedisEventLog::LogMessage(LPCSTR msg, const WORD type) { - DWORD eventID; - switch (type) { - case EVENTLOG_ERROR_TYPE: -- eventID = MSG_ERROR_1; -+ eventID = 0x2; - break; - case EVENTLOG_WARNING_TYPE: -- eventID = MSG_WARNING_1; -+ eventID = 0x1; - break; - case EVENTLOG_INFORMATION_TYPE: -- eventID = MSG_INFO_1; -+ eventID = 0x0; - break; - default: - std::cerr << "Unrecognized type: " << type << "\n"; -- eventID = MSG_INFO_1; -+ eventID = 0x0; - break; - } - -diff --git a/src/Win32_Interop/Win32_FDAPI.cpp b/src/Win32_Interop/Win32_FDAPI.cpp -index 3df9af1..f60e3d4 ---- a/src/Win32_Interop/Win32_FDAPI.cpp -+++ b/src/Win32_Interop/Win32_FDAPI.cpp -@@ -46,11 +46,13 @@ fdapi_access access = NULL; - fdapi_bind bind = NULL; - fdapi_connect connect = NULL; - fdapi_fcntl fcntl = NULL; -+fdapi_ioctl ioctl = NULL; - fdapi_fstat fdapi_fstat64 = NULL; - fdapi_fsync fsync = NULL; - fdapi_ftruncate ftruncate = NULL; - fdapi_freeaddrinfo freeaddrinfo = NULL; - fdapi_getaddrinfo getaddrinfo = NULL; -+fdapi_gethostbyname gethostbyname = NULL; - fdapi_getpeername getpeername = NULL; - fdapi_getsockname getsockname = NULL; - fdapi_getsockopt getsockopt = NULL; -@@ -67,7 +69,9 @@ fdapi_open open = NULL; - fdapi_pipe pipe = NULL; - fdapi_poll poll = NULL; - fdapi_read read = NULL; -+fdapi_recv recv = NULL; - fdapi_select select = NULL; -+fdapi_send send = NULL; - fdapi_setsockopt setsockopt = NULL; - fdapi_socket socket = NULL; - fdapi_write write = NULL; -@@ -622,6 +626,23 @@ int FDAPI_fcntl(int rfd, int cmd, int flags = 0 ) { - return -1; - } - -+int FDAPI_ioctl(int rfd, int cmd, char *buf) { -+ try { -+ SocketInfo* socket_info = RFDMap::getInstance().lookupSocketInfo(rfd); -+ if (socket_info != NULL && socket_info->socket != INVALID_SOCKET) { -+ if 
(f_ioctlsocket(socket_info->socket, cmd, (u_long *)buf) != SOCKET_ERROR) { -+ return 0; -+ } else { -+ errno = f_WSAGetLastError(); -+ return -1; -+ } -+ } -+ } CATCH_AND_REPORT(); -+ -+ errno = EBADF; -+ return -1; -+} -+ - int FDAPI_poll(struct pollfd *fds, nfds_t nfds, int timeout) { - try { - struct pollfd* pollCopy = new struct pollfd[nfds]; -@@ -777,6 +798,42 @@ ssize_t FDAPI_read(int rfd, void *buf, size_t count) { - return -1; - } - -+ssize_t FDAPI_recv(int rfd, void *buf, size_t count, int flags) { -+ try { -+ SOCKET socket = RFDMap::getInstance().lookupSocket(rfd); -+ if (socket != INVALID_SOCKET) { -+ int retval = f_recv(socket, (char*) buf, (unsigned int) count, flags); -+ if (retval == -1) { -+ errno = GetLastError(); -+ if (errno == WSAEWOULDBLOCK) { -+ errno = EAGAIN; -+ } -+ } -+ return retval; -+ } -+ } CATCH_AND_REPORT(); -+ errno = EBADF; -+ return -1; -+} -+ -+ssize_t FDAPI_send(int rfd, const void *buf, size_t count, int flags) { -+ try { -+ SOCKET socket = RFDMap::getInstance().lookupSocket(rfd); -+ if (socket != INVALID_SOCKET) { -+ int retval = f_send(socket, (const char*) buf, (unsigned int) count, flags); -+ if (retval == -1) { -+ errno = GetLastError(); -+ if (errno == WSAEWOULDBLOCK) { -+ errno = EAGAIN; -+ } -+ } -+ return retval; -+ } -+ } CATCH_AND_REPORT(); -+ errno = EBADF; -+ return -1; -+} -+ - ssize_t FDAPI_write(int rfd, const void *buf, size_t count) { - try { - SOCKET socket = RFDMap::getInstance().lookupSocket(rfd); -@@ -1195,12 +1252,14 @@ private: - bind = FDAPI_bind; - connect = FDAPI_connect; - fcntl = FDAPI_fcntl; -+ ioctl = FDAPI_ioctl; - fdapi_fstat64 = (fdapi_fstat) FDAPI_fstat64; - freeaddrinfo = FDAPI_freeaddrinfo; - fsync = FDAPI_fsync; - ftruncate = FDAPI_ftruncate; - getaddrinfo = FDAPI_getaddrinfo; - getsockopt = FDAPI_getsockopt; -+ gethostbyname = FDAPI_gethostbyname; - getpeername = FDAPI_getpeername; - getsockname = FDAPI_getsockname; - htonl = FDAPI_htonl; -@@ -1216,9 +1275,11 @@ private: - pipe = FDAPI_pipe; - poll = FDAPI_poll; - read = FDAPI_read; -+ recv = FDAPI_recv; - select = FDAPI_select; - setsockopt = FDAPI_setsockopt; - socket = FDAPI_socket; -+ send = FDAPI_send; - write = FDAPI_write; - } - -diff --git a/src/Win32_Interop/Win32_FDAPI.h b/src/Win32_Interop/Win32_FDAPI.h -index 8fae9c7..6e09596 ---- a/src/Win32_Interop/Win32_FDAPI.h -+++ b/src/Win32_Interop/Win32_FDAPI.h -@@ -116,9 +116,12 @@ typedef int (*fdapi_open)(const char * _Filename, int _OpenFlag, int flags); - typedef int (*fdapi_accept)(int sockfd, struct sockaddr *addr, socklen_t *addrlen); - typedef int (*fdapi_setsockopt)(int sockfd, int level, int optname,const void *optval, socklen_t optlen); - typedef int (*fdapi_fcntl)(int fd, int cmd, int flags); -+typedef int (*fdapi_ioctl)(int fd, int cmd, char *buf); - typedef int (*fdapi_poll)(struct pollfd *fds, nfds_t nfds, int timeout); - typedef int (*fdapi_getsockopt)(int sockfd, int level, int optname, void *optval, socklen_t *optlen); - typedef int (*fdapi_connect)(int sockfd, const struct sockaddr *addr, size_t addrlen); -+typedef ssize_t (*fdapi_recv)(int fd, void *buf, size_t count, int flags); -+typedef ssize_t (*fdapi_send)(int rfd, void const *buf, size_t count, int flags); - typedef ssize_t (*fdapi_read)(int fd, void *buf, size_t count); - typedef ssize_t (*fdapi_write)(int fd, const void *buf, size_t count); - typedef int (*fdapi_fsync)(int fd); -@@ -128,6 +131,7 @@ typedef int (*fdapi_bind)(int sockfd, const struct sockaddr *addr, socklen_t add - typedef u_short (*fdapi_htons)(u_short hostshort); - 
typedef u_long (*fdapi_htonl)(u_long hostlong); - typedef u_short (*fdapi_ntohs)(u_short netshort); -+typedef struct hostent* (*fdapi_gethostbyname)(const char *name); - typedef int (*fdapi_getpeername)(int sockfd, struct sockaddr *addr, socklen_t * addrlen); - typedef int (*fdapi_getsockname)(int sockfd, struct sockaddr* addrsock, int* addrlen ); - typedef void (*fdapi_freeaddrinfo)(struct addrinfo *ai); -@@ -159,12 +163,14 @@ extern fdapi_access access; - extern fdapi_bind bind; - extern fdapi_connect connect; - extern fdapi_fcntl fcntl; -+extern fdapi_ioctl ioctl; - extern fdapi_fstat fdapi_fstat64; - extern fdapi_freeaddrinfo freeaddrinfo; - extern fdapi_fsync fsync; - extern fdapi_ftruncate ftruncate; - extern fdapi_getaddrinfo getaddrinfo; - extern fdapi_getsockopt getsockopt; -+extern fdapi_gethostbyname gethostbyname; - extern fdapi_getpeername getpeername; - extern fdapi_getsockname getsockname; - extern fdapi_htonl htonl; -@@ -180,7 +186,9 @@ extern fdapi_open open; - extern fdapi_pipe pipe; - extern fdapi_poll poll; - extern fdapi_read read; -+extern fdapi_recv recv; - extern fdapi_select select; -+extern fdapi_send send; - extern fdapi_setsockopt setsockopt; - extern fdapi_socket socket; - extern fdapi_write write; -diff --git a/src/Win32_Interop/Win32_Interop.vcxproj b/src/Win32_Interop/Win32_Interop.vcxproj -index 93fc44b..b75d89b ---- a/src/Win32_Interop/Win32_Interop.vcxproj -+++ b/src/Win32_Interop/Win32_Interop.vcxproj -@@ -74,35 +74,6 @@ - - - -- -- -- Document -- md resources --mc.exe -A -b -c -h . -r resources EventLog.mc --rc.exe -foresources/EventLog.res resources/EventLog.rc --link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll -- -- md resources --mc.exe -A -b -c -h . -r resources EventLog.mc --rc.exe -foresources/EventLog.res resources/EventLog.rc --link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll -- -- EventLog.h -- EventLog.h -- md resources --mc.exe -A -b -c -h . -r resources EventLog.mc --rc.exe -foresources/EventLog.res resources/EventLog.rc --link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll -- -- md resources --mc.exe -A -b -c -h . 
-r resources EventLog.mc --rc.exe -foresources/EventLog.res resources/EventLog.rc --link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll -- -- EventLog.h -- EventLog.h -- -- - - {8C07F811-C81C-432C-B334-1AE6FAECF951} - Win32Proj -@@ -113,27 +84,25 @@ link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll - - StaticLibrary - true -- v120 -+ v140_xp - Unicode - - - StaticLibrary - true -- v120 -+ v140_xp - Unicode - - - StaticLibrary - false -- v120 -- true -+ v140_xp - Unicode - - - StaticLibrary - false -- v120 -- true -+ v140_xp - Unicode - - -@@ -152,13 +121,9 @@ link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll - - - -- -- $(SolutionDir)$(Platform)\$(Configuration)\ -- $(Platform)\$(Configuration)\ -- -- -- $(SolutionDir)$(Platform)\$(Configuration)\ -- $(Platform)\$(Configuration)\ -+ -+ $(SolutionDir)build\$(Platform)\$(Configuration)\ -+ $(SolutionDir)build\$(Platform)\$(Configuration)\$(MSBuildProjectName)\ - - - -@@ -166,9 +131,10 @@ link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll - - Level3 - Disabled -- USE_STATIC;USE_JEMALLOC;_OFF_T_DEFINED;WIN32;_DEBUG;_LIB;%(PreprocessorDefinitions);LACKS_STDLIB_H;_CRT_SECURE_NO_WARNINGS;PSAPI_VERSION=1 -+ _WIN32_WINNT=0x0502;USE_STATIC;USE_JEMALLOC;_OFF_T_DEFINED;_NO_CRT_STDIO_INLINE;_CRT_SECURE_NO_DEPRECATE;WIN32;_DEBUG;_LIB;%(PreprocessorDefinitions);LACKS_STDLIB_H;_CRT_SECURE_NO_WARNINGS;PSAPI_VERSION=1 - $(ProjectDir)..\..\deps\lua\src;$(ProjectDir)..\..\deps\jemalloc-win\include -- MultiThreadedDebug -+ false -+ true - - - Windows -@@ -186,9 +152,10 @@ link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll - - Level3 - Disabled -- USE_STATIC;USE_JEMALLOC;_OFF_T_DEFINED;WIN32;_DEBUG;_LIB;%(PreprocessorDefinitions);LACKS_STDLIB_H;_CRT_SECURE_NO_WARNINGS;PSAPI_VERSION=1;_WIN32_WINNT=0x0501 -+ _WIN32_WINNT=0x0502;USE_STATIC;USE_JEMALLOC;_OFF_T_DEFINED;_NO_CRT_STDIO_INLINE;_CRT_SECURE_NO_DEPRECATE;WIN32;_DEBUG;_LIB;%(PreprocessorDefinitions);LACKS_STDLIB_H;_CRT_SECURE_NO_WARNINGS;PSAPI_VERSION=1;_WIN32_WINNT=0x0501 - $(ProjectDir)..\..\deps\lua\src;$(ProjectDir)..\..\deps\jemalloc-win\include -- MultiThreadedDebug -+ false -+ true - - - Windows -@@ -211,10 +178,9 @@ link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll - Full - true - true -- USE_STATIC;USE_JEMALLOC;_OFF_T_DEFINED;WIN32;NDEBUG;_LIB;%(PreprocessorDefinitions);LACKS_STDLIB_H;_CRT_SECURE_NO_WARNINGS;PSAPI_VERSION=1 -+ _WIN32_WINNT=0x0502;USE_STATIC;USE_JEMALLOC;_OFF_T_DEFINED;_NO_CRT_STDIO_INLINE;_CRT_SECURE_NO_DEPRECATE;WIN32;NDEBUG;_LIB;%(PreprocessorDefinitions);LACKS_STDLIB_H;_CRT_SECURE_NO_WARNINGS;PSAPI_VERSION=1 - $(ProjectDir)..\..\deps\lua\src;$(ProjectDir)..\..\deps\jemalloc-win\include -- MultiThreaded -- true -+ true - - - Windows -@@ -235,9 +201,9 @@ link.exe -dll -noentry resources/EventLog.res -out:$(TargetDir)EventLog.dll - MaxSpeed - true - true -- USE_STATIC;USE_JEMALLOC;_OFF_T_DEFINED;WIN32;NDEBUG;_LIB;%(PreprocessorDefinitions);LACKS_STDLIB_H;_CRT_SECURE_NO_WARNINGS;PSAPI_VERSION=1;_WIN32_WINNT=0x0501 -+ _WIN32_WINNT=0x0502;USE_STATIC;USE_JEMALLOC;_OFF_T_DEFINED;_NO_CRT_STDIO_INLINE;_CRT_SECURE_NO_DEPRECATE;WIN32;NDEBUG;_LIB;%(PreprocessorDefinitions);LACKS_STDLIB_H;_CRT_SECURE_NO_WARNINGS;PSAPI_VERSION=1;_WIN32_WINNT=0x0501 - $(ProjectDir)..\..\deps\lua\src;$(ProjectDir)..\..\deps\jemalloc-win\include -- MultiThreaded -+ true - - - Windows -diff --git a/src/Win32_Interop/Win32_service.cpp 
b/src/Win32_Interop/Win32_service.cpp -index 488538e..1c33f53 ---- a/src/Win32_Interop/Win32_service.cpp -+++ b/src/Win32_Interop/Win32_service.cpp -@@ -59,7 +59,6 @@ this should preceed the other arguments passed to redis. For instance: - #include - #include - #include --#include - #include - #include "Win32_EventLog.h" - #include -diff --git a/src/ziplist.c b/src/ziplist.c -index 24b0a7c..29d445d ---- a/src/ziplist.c -+++ b/src/ziplist.c -@@ -920,7 +920,7 @@ void ziplistRepr(unsigned char *zl) { - entry = zipEntry(p); - printf( - "{" -- "addr 0x%08lx, " /* TODO" verify 0x%08lx */ -+ "addr %p, " - "index %2d, " - "offset %5ld, " - "rl: %5u, " -@@ -929,9 +929,9 @@ void ziplistRepr(unsigned char *zl) { - "pls: %2u, " - "payload %5u" - "} ", -- (PORT_ULONG)p, -+ (void *)p, - index, -- (PORT_ULONG)(p-zl), -+ (long)(p-zl), - entry.headersize+entry.len, - entry.headersize, - entry.prevrawlen, diff --git a/src/global_scheduler/CMakeLists.txt b/src/global_scheduler/CMakeLists.txt deleted file mode 100644 index fec7ec2810d9c..0000000000000 --- a/src/global_scheduler/CMakeLists.txt +++ /dev/null @@ -1,14 +0,0 @@ -cmake_minimum_required(VERSION 3.4) - -project(global_scheduler) - -include_directories(${CMAKE_CURRENT_LIST_DIR}) - -set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Werror -Wall") - -add_executable(global_scheduler global_scheduler.cc global_scheduler_algorithm.cc) - -# Make sure ${HIREDIS_LIB} is ready before linking. -add_dependencies(global_scheduler hiredis common) - -target_link_libraries(global_scheduler common ${HIREDIS_LIB} ray_static ${PLASMA_STATIC_LIB} ${ARROW_STATIC_LIB} ${Boost_SYSTEM_LIBRARY} pthread) diff --git a/src/global_scheduler/global_scheduler.cc b/src/global_scheduler/global_scheduler.cc deleted file mode 100644 index 069ad6865d174..0000000000000 --- a/src/global_scheduler/global_scheduler.cc +++ /dev/null @@ -1,492 +0,0 @@ -#include -#include -#include - -#include "common.h" -#include "event_loop.h" -#include "global_scheduler.h" -#include "global_scheduler_algorithm.h" -#include "net.h" -#include "ray/util/util.h" -#include "state/db_client_table.h" -#include "state/local_scheduler_table.h" -#include "state/object_table.h" -#include "state/table.h" -#include "state/task_table.h" - -/** - * Retry the task assignment. If the local scheduler that the task is assigned - * to is no longer active, do not retry the assignment. - * TODO(rkn): We currently only retry the method if the global scheduler - * publishes a task to a local scheduler before the local scheduler has - * subscribed to the channel. If we enforce that ordering, we can remove this - * retry method. - * - * @param id The task ID. - * @param user_context The global scheduler state. - * @param user_data The Task that failed to be assigned. - * @return Void. - */ -void assign_task_to_local_scheduler_retry(UniqueID id, - void *user_context, - void *user_data) { - GlobalSchedulerState *state = (GlobalSchedulerState *) user_context; - Task *task = (Task *) user_data; - RAY_CHECK(Task_state(task) == TaskStatus::SCHEDULED); - - // If the local scheduler has died since we requested the task assignment, do - // not retry again. - DBClientID local_scheduler_id = Task_local_scheduler(task); - auto it = state->local_schedulers.find(local_scheduler_id); - if (it == state->local_schedulers.end()) { - return; - } - - // The local scheduler is still alive. The failure is most likely due to the - // task assignment getting published before the local scheduler subscribed to - // the channel. Retry the assignment. 
- auto retryInfo = RetryInfo{ - .num_retries = 0, // This value is unused. - .timeout = 0, // This value is unused. - .fail_callback = assign_task_to_local_scheduler_retry, - }; - task_table_update(state->db, Task_copy(task), &retryInfo, NULL, user_context); -} - -/** - * Assign the given task to the local scheduler, update Redis and scheduler data - * structures. - * - * @param state Global scheduler state. - * @param task Task to be assigned to the local scheduler. - * @param local_scheduler_id DB client ID for the local scheduler. - * @return Void. - */ -void assign_task_to_local_scheduler(GlobalSchedulerState *state, - Task *task, - DBClientID local_scheduler_id) { - TaskSpec *spec = Task_task_execution_spec(task)->Spec(); - RAY_LOG(DEBUG) << "assigning task to local_scheduler_id = " - << local_scheduler_id; - Task_set_state(task, TaskStatus::SCHEDULED); - Task_set_local_scheduler(task, local_scheduler_id); - RAY_LOG(DEBUG) << "Issuing a task table update for task = " - << Task_task_id(task); - - auto retryInfo = RetryInfo{ - .num_retries = 0, // This value is unused. - .timeout = 0, // This value is unused. - .fail_callback = assign_task_to_local_scheduler_retry, - }; - task_table_update(state->db, Task_copy(task), &retryInfo, NULL, state); - - /* Update the object table info to reflect the fact that the results of this - * task will be created on the machine that the task was assigned to. This can - * be used to improve locality-aware scheduling. */ - for (int64_t i = 0; i < TaskSpec_num_returns(spec); ++i) { - ObjectID return_id = TaskSpec_return(spec, i); - if (state->scheduler_object_info_table.find(return_id) == - state->scheduler_object_info_table.end()) { - SchedulerObjectInfo &obj_info_entry = - state->scheduler_object_info_table[return_id]; - /* The value -1 indicates that the size of the object is not known yet. */ - obj_info_entry.data_size = -1; - } - RAY_CHECK(state->local_scheduler_plasma_map.count(local_scheduler_id) == 1); - state->scheduler_object_info_table[return_id].object_locations.push_back( - state->local_scheduler_plasma_map[local_scheduler_id]); - } - - /* TODO(rkn): We should probably pass around local_scheduler struct pointers - * instead of db_client_id objects. */ - /* Update the local scheduler info. */ - auto it = state->local_schedulers.find(local_scheduler_id); - RAY_CHECK(it != state->local_schedulers.end()); - - LocalScheduler &local_scheduler = it->second; - local_scheduler.num_tasks_sent += 1; - local_scheduler.num_recent_tasks_sent += 1; - // Resource accounting update for this local scheduler. - for (auto const &resource_pair : TaskSpec_get_required_resources(spec)) { - std::string resource_name = resource_pair.first; - double resource_quantity = resource_pair.second; - // The local scheduler must have this resource because otherwise we wouldn't - // be assigning the task to this local scheduler. - RAY_CHECK(local_scheduler.info.dynamic_resources.count(resource_name) == - 1 || - resource_quantity == 0); - // Subtract task's resource from the cached dynamic resource capacity for - // this local scheduler. This will be overwritten on the next heartbeat. 
- local_scheduler.info.dynamic_resources[resource_name] = - MAX(0, local_scheduler.info.dynamic_resources[resource_name] - - resource_quantity); - } -} - -GlobalSchedulerState *GlobalSchedulerState_init(event_loop *loop, - const char *node_ip_address, - const char *redis_primary_addr, - int redis_primary_port) { - GlobalSchedulerState *state = new GlobalSchedulerState(); - state->loop = loop; - state->db = db_connect(std::string(redis_primary_addr), redis_primary_port, - "global_scheduler", node_ip_address, - std::vector()); - db_attach(state->db, loop, false); - state->policy_state = GlobalSchedulerPolicyState_init(); - return state; -} - -void GlobalSchedulerState_free(GlobalSchedulerState *state) { - db_disconnect(state->db); - state->local_schedulers.clear(); - GlobalSchedulerPolicyState_free(state->policy_state); - /* Delete the plasma to local scheduler association map. */ - state->plasma_local_scheduler_map.clear(); - - /* Delete the local scheduler to plasma association map. */ - state->local_scheduler_plasma_map.clear(); - - /* Free the scheduler object info table. */ - state->scheduler_object_info_table.clear(); - /* Free the array of unschedulable tasks. */ - int64_t num_pending_tasks = state->pending_tasks.size(); - if (num_pending_tasks > 0) { - RAY_LOG(WARNING) << "There are " << num_pending_tasks - << " remaining tasks in the pending tasks array."; - } - for (int i = 0; i < num_pending_tasks; ++i) { - Task *pending_task = state->pending_tasks[i]; - Task_free(pending_task); - } - state->pending_tasks.clear(); - - /* Destroy the event loop. */ - destroy_outstanding_callbacks(state->loop); - event_loop_destroy(state->loop); - state->loop = NULL; - - /* Free the global scheduler state. */ - delete state; -} - -/* We need this code so we can clean up when we get a SIGTERM signal. */ - -GlobalSchedulerState *g_state; - -void signal_handler(int signal) { - if (signal == SIGTERM) { - GlobalSchedulerState_free(g_state); - exit(0); - } -} - -/* End of the cleanup code. */ - -void process_task_waiting(Task *waiting_task, void *user_context) { - GlobalSchedulerState *state = (GlobalSchedulerState *) user_context; - RAY_LOG(DEBUG) << "Task waiting callback is called."; - bool successfully_assigned = - handle_task_waiting(state, state->policy_state, waiting_task); - /* If the task was not successfully submitted to a local scheduler, add the - * task to the array of pending tasks. The global scheduler will periodically - * resubmit the tasks in this array. */ - if (!successfully_assigned) { - Task *task_copy = Task_copy(waiting_task); - state->pending_tasks.push_back(task_copy); - } -} - -void add_local_scheduler(GlobalSchedulerState *state, - DBClientID db_client_id, - const char *manager_address) { - /* Add plasma_manager ip:port -> local_scheduler_db_client_id association to - * state. */ - state->plasma_local_scheduler_map[std::string(manager_address)] = - db_client_id; - - /* Add local_scheduler_db_client_id -> plasma_manager ip:port association to - * state. */ - state->local_scheduler_plasma_map[db_client_id] = - std::string(manager_address); - - /* Add new local scheduler to the state. */ - LocalScheduler &local_scheduler = state->local_schedulers[db_client_id]; - local_scheduler.id = db_client_id; - local_scheduler.num_heartbeats_missed = 0; - local_scheduler.num_tasks_sent = 0; - local_scheduler.num_recent_tasks_sent = 0; - local_scheduler.info.task_queue_length = 0; - local_scheduler.info.available_workers = 0; - - /* Allow the scheduling algorithm to process this event. 
*/ - handle_new_local_scheduler(state, state->policy_state, db_client_id); -} - -std::unordered_map::iterator remove_local_scheduler( - GlobalSchedulerState *state, - std::unordered_map::iterator it) { - RAY_CHECK(it != state->local_schedulers.end()); - DBClientID local_scheduler_id = it->first; - it = state->local_schedulers.erase(it); - - /* Remove the local scheduler from the mappings. This code only makes sense if - * there is a one-to-one mapping between local schedulers and plasma managers. - */ - std::string manager_address = - state->local_scheduler_plasma_map[local_scheduler_id]; - state->local_scheduler_plasma_map.erase(local_scheduler_id); - state->plasma_local_scheduler_map.erase(manager_address); - - handle_local_scheduler_removed(state, state->policy_state, - local_scheduler_id); - return it; -} - -/** - * Process a notification about a new DB client connecting to Redis. - * - * @param manager_address An ip:port pair for the plasma manager associated with - * this db client. - * @return Void. - */ -void process_new_db_client(DBClient *db_client, void *user_context) { - GlobalSchedulerState *state = (GlobalSchedulerState *) user_context; - RAY_LOG(DEBUG) << "db client table callback for db client = " - << db_client->id; - if (strncmp(db_client->client_type.c_str(), "local_scheduler", - strlen("local_scheduler")) == 0) { - bool local_scheduler_present = - (state->local_schedulers.find(db_client->id) != - state->local_schedulers.end()); - if (db_client->is_alive) { - /* This is a notification for an insert. We may receive duplicate - * notifications since we read the entire table before processing - * notifications. Filter out local schedulers that we already added. */ - if (!local_scheduler_present) { - add_local_scheduler(state, db_client->id, - db_client->manager_address.c_str()); - } - } else { - if (local_scheduler_present) { - remove_local_scheduler(state, - state->local_schedulers.find(db_client->id)); - } - } - } -} - -/** - * Process notification about the new object information. - * - * @param object_id ID of the object that the notification is about. - * @param data_size The object size. - * @param manager_count The number of locations for this object. - * @param manager_ids The vector of Plasma Manager client IDs. - * @param user_context The user context. - * @return Void. - */ -void object_table_subscribe_callback(ObjectID object_id, - int64_t data_size, - const std::vector &manager_ids, - void *user_context) { - /* Extract global scheduler state from the callback context. */ - GlobalSchedulerState *state = (GlobalSchedulerState *) user_context; - RAY_LOG(DEBUG) << "object table subscribe callback for OBJECT = " - << object_id; - - const std::vector managers = - db_client_table_get_ip_addresses(state->db, manager_ids); - RAY_LOG(DEBUG) << "\tManagers<" << managers.size() << ">:"; - for (size_t i = 0; i < managers.size(); i++) { - RAY_LOG(DEBUG) << "\t\t" << managers[i]; - } - - if (state->scheduler_object_info_table.find(object_id) == - state->scheduler_object_info_table.end()) { - /* Construct a new object info hash table entry. 
*/ - SchedulerObjectInfo &obj_info_entry = - state->scheduler_object_info_table[object_id]; - obj_info_entry.data_size = data_size; - - RAY_LOG(DEBUG) << "New object added to object_info_table with id = " - << object_id; - RAY_LOG(DEBUG) << "\tmanager locations:"; - for (size_t i = 0; i < managers.size(); i++) { - RAY_LOG(DEBUG) << "\t\t" << managers[i]; - } - } - - SchedulerObjectInfo &obj_info_entry = - state->scheduler_object_info_table[object_id]; - - /* In all cases, replace the object location vector on each callback. */ - obj_info_entry.object_locations.clear(); - for (size_t i = 0; i < managers.size(); i++) { - obj_info_entry.object_locations.push_back(managers[i]); - } -} - -void local_scheduler_table_handler(DBClientID client_id, - LocalSchedulerInfo info, - void *user_context) { - /* Extract global scheduler state from the callback context. */ - GlobalSchedulerState *state = (GlobalSchedulerState *) user_context; - ARROW_UNUSED(state); - RAY_LOG(DEBUG) << "Local scheduler heartbeat from db_client_id " << client_id; - RAY_LOG(DEBUG) << "total workers = " << info.total_num_workers - << ", task queue length = " << info.task_queue_length - << ", available workers = " << info.available_workers; - - /* Update the local scheduler info struct. */ - auto it = state->local_schedulers.find(client_id); - if (it != state->local_schedulers.end()) { - if (info.is_dead) { - /* The local scheduler is exiting. Increase the number of heartbeats - * missed to the timeout threshold. This will trigger removal of the - * local scheduler the next time the timeout handler fires. */ - it->second.num_heartbeats_missed = - RayConfig::instance().num_heartbeats_timeout(); - } else { - /* Reset the number of tasks sent since the last heartbeat. */ - LocalScheduler &local_scheduler = it->second; - local_scheduler.num_heartbeats_missed = 0; - local_scheduler.num_recent_tasks_sent = 0; - local_scheduler.info = info; - } - } else { - RAY_LOG(WARNING) << "client_id didn't match any cached local scheduler " - << "entries"; - } -} - -int task_cleanup_handler(event_loop *loop, timer_id id, void *context) { - GlobalSchedulerState *state = (GlobalSchedulerState *) context; - /* Loop over the pending tasks in reverse order and resubmit them. */ - auto it = state->pending_tasks.end(); - while (it != state->pending_tasks.begin()) { - it--; - Task *pending_task = *it; - /* Pretend that the task has been resubmitted. */ - bool successfully_assigned = - handle_task_waiting(state, state->policy_state, pending_task); - if (successfully_assigned) { - /* The task was successfully assigned, so remove it from this list and - * free it. This uses the fact that pending_tasks is a vector and so erase - * returns an iterator to the next element in the vector. */ - it = state->pending_tasks.erase(it); - Task_free(pending_task); - } - } - - return GLOBAL_SCHEDULER_TASK_CLEANUP_MILLISECONDS; -} - -int heartbeat_timeout_handler(event_loop *loop, timer_id id, void *context) { - GlobalSchedulerState *state = (GlobalSchedulerState *) context; - /* Check for local schedulers that have missed a number of heartbeats. If any - * local schedulers have died, notify others so that the state can be cleaned - * up. */ - /* TODO(swang): If the local scheduler hasn't actually died, then it should - * clean up its state and exit upon receiving this notification. 
*/ - auto it = state->local_schedulers.begin(); - while (it != state->local_schedulers.end()) { - if (it->second.num_heartbeats_missed >= - RayConfig::instance().num_heartbeats_timeout()) { - RAY_LOG(WARNING) << "Missed too many heartbeats from local scheduler, " - << "marking as dead."; - /* Notify others by updating the global state. */ - db_client_table_remove(state->db, it->second.id, NULL, NULL, NULL); - /* Remove the scheduler from the local state. The call to - * remove_local_scheduler modifies the container in place and returns the - * next iterator. */ - it = remove_local_scheduler(state, it); - } else { - it->second.num_heartbeats_missed += 1; - it++; - } - } - - /* Reset the timer. */ - return RayConfig::instance().heartbeat_timeout_milliseconds(); -} - -void start_server(const char *node_ip_address, - const char *redis_primary_addr, - int redis_primary_port) { - event_loop *loop = event_loop_create(); - g_state = GlobalSchedulerState_init(loop, node_ip_address, redis_primary_addr, - redis_primary_port); - /* TODO(rkn): subscribe to notifications from the object table. */ - /* Subscribe to notifications about new local schedulers. TODO(rkn): this - * needs to also get all of the clients that registered with the database - * before this call to subscribe. */ - db_client_table_subscribe(g_state->db, process_new_db_client, - (void *) g_state, NULL, NULL, NULL); - /* Subscribe to notifications about waiting tasks. If a local scheduler - * submits tasks to the global scheduler before the global scheduler - * successfully subscribes, then the local scheduler that submitted the tasks - * will retry. */ - task_table_subscribe(g_state->db, UniqueID::nil(), TaskStatus::WAITING, - process_task_waiting, (void *) g_state, NULL, NULL, - NULL); - - object_table_subscribe_to_notifications(g_state->db, true, - object_table_subscribe_callback, - g_state, NULL, NULL, NULL); - /* Subscribe to notifications from local schedulers. These notifications serve - * as heartbeats and contain informaion about the load on the local - * schedulers. */ - local_scheduler_table_subscribe(g_state->db, local_scheduler_table_handler, - g_state, NULL); - /* Start a timer that periodically checks if there are queued tasks that can - * be scheduled. Currently this is only used to handle the special case in - * which a task is waiting and no node meets its static resource requirements. - * If a new node joins the cluster that does have enough resources, then this - * timer should notice and schedule the task. */ - event_loop_add_timer(loop, GLOBAL_SCHEDULER_TASK_CLEANUP_MILLISECONDS, - task_cleanup_handler, g_state); - event_loop_add_timer(loop, - RayConfig::instance().heartbeat_timeout_milliseconds(), - heartbeat_timeout_handler, g_state); - /* Start the event loop. */ - event_loop_run(loop); -} - -int main(int argc, char *argv[]) { - InitShutdownRAII ray_log_shutdown_raii( - ray::RayLog::StartRayLog, ray::RayLog::ShutDownRayLog, argv[0], RAY_INFO, - /*log_dir=*/""); - ray::RayLog::InstallFailureSignalHandler(); - signal(SIGTERM, signal_handler); - /* IP address and port of the primary redis instance. */ - char *redis_primary_addr_port = NULL; - /* The IP address of the node that this global scheduler is running on. 
*/ - char *node_ip_address = NULL; - int c; - while ((c = getopt(argc, argv, "h:r:")) != -1) { - switch (c) { - case 'r': - redis_primary_addr_port = optarg; - break; - case 'h': - node_ip_address = optarg; - break; - default: - RAY_LOG(FATAL) << "unknown option " << c; - } - } - - char redis_primary_addr[16]; - int redis_primary_port = -1; - if (!redis_primary_addr_port || - parse_ip_addr_port(redis_primary_addr_port, redis_primary_addr, - &redis_primary_port) == -1) { - RAY_LOG(FATAL) << "specify the primary redis address like 127.0.0.1:6379 " - << "with the -r switch"; - } - if (!node_ip_address) { - RAY_LOG(FATAL) << "specify the node IP address with the -h switch"; - } - start_server(node_ip_address, redis_primary_addr, redis_primary_port); -} diff --git a/src/global_scheduler/global_scheduler.h b/src/global_scheduler/global_scheduler.h deleted file mode 100644 index e1610c555088c..0000000000000 --- a/src/global_scheduler/global_scheduler.h +++ /dev/null @@ -1,94 +0,0 @@ -#ifndef GLOBAL_SCHEDULER_H -#define GLOBAL_SCHEDULER_H - -#include "task.h" - -#include - -#include "ray/gcs/client.h" -#include "state/db.h" -#include "state/local_scheduler_table.h" - -/* The frequency with which the global scheduler checks if there are any tasks - * that haven't been scheduled yet. */ -#define GLOBAL_SCHEDULER_TASK_CLEANUP_MILLISECONDS 100 - -/** Contains all information that is associated with a local scheduler. */ -typedef struct { - /** The ID of the local scheduler in Redis. */ - DBClientID id; - /** The number of heartbeat intervals that have passed since we last heard - * from this local scheduler. */ - int64_t num_heartbeats_missed; - /** The number of tasks sent from the global scheduler to this local - * scheduler. */ - int64_t num_tasks_sent; - /** The number of tasks sent from the global scheduler to this local scheduler - * since the last heartbeat arrived. */ - int64_t num_recent_tasks_sent; - /** The latest information about the local scheduler capacity. This is updated - * every time a new local scheduler heartbeat arrives. */ - LocalSchedulerInfo info; -} LocalScheduler; - -typedef class GlobalSchedulerPolicyState GlobalSchedulerPolicyState; - -/** - * This defines a hash table used to cache information about different objects. - */ -typedef struct { - /** The size in bytes of the object. */ - int64_t data_size; - /** A vector of object locations for this object. */ - std::vector object_locations; -} SchedulerObjectInfo; - -/** - * Global scheduler state structure. - */ -typedef struct { - /** The global scheduler event loop. */ - event_loop *loop; - /** The global state store database. */ - DBHandle *db; - /** A hash table mapping local scheduler ID to the local schedulers that are - * connected to Redis. */ - std::unordered_map local_schedulers; - /** The state managed by the scheduling policy. */ - GlobalSchedulerPolicyState *policy_state; - /** The plasma_manager ip:port -> local_scheduler_db_client_id association. */ - std::unordered_map plasma_local_scheduler_map; - /** The local_scheduler_db_client_id -> plasma_manager ip:port association. */ - std::unordered_map local_scheduler_plasma_map; - /** Objects cached by this global scheduler instance. */ - std::unordered_map scheduler_object_info_table; - /** An array of tasks that haven't been scheduled yet. */ - std::vector pending_tasks; -} GlobalSchedulerState; - -/** - * This is a helper method to look up the local scheduler struct that - * corresponds to a particular local_scheduler_id. 
- * - * @param state The state of the global scheduler. - * @param The local_scheduler_id of the local scheduler. - * @return The corresponding local scheduler struct. If the global scheduler is - * not aware of the local scheduler, then this will be NULL. - */ -LocalScheduler *get_local_scheduler(GlobalSchedulerState *state, - DBClientID local_scheduler_id); - -/** - * Assign the given task to the local scheduler, update Redis and scheduler data - * structures. - * - * @param state Global scheduler state. - * @param task Task to be assigned to the local scheduler. - * @param local_scheduler_id DB client ID for the local scheduler. - * @return Void. - */ -void assign_task_to_local_scheduler(GlobalSchedulerState *state, - Task *task, - DBClientID local_scheduler_id); - -#endif /* GLOBAL_SCHEDULER_H */ diff --git a/src/global_scheduler/global_scheduler_algorithm.cc b/src/global_scheduler/global_scheduler_algorithm.cc deleted file mode 100644 index 7ca1b86be9148..0000000000000 --- a/src/global_scheduler/global_scheduler_algorithm.cc +++ /dev/null @@ -1,257 +0,0 @@ -#include - -#include "task.h" -#include "state/task_table.h" - -#include "global_scheduler_algorithm.h" - -GlobalSchedulerPolicyState *GlobalSchedulerPolicyState_init(void) { - GlobalSchedulerPolicyState *policy_state = new GlobalSchedulerPolicyState(); - return policy_state; -} - -void GlobalSchedulerPolicyState_free(GlobalSchedulerPolicyState *policy_state) { - delete policy_state; -} - -/** - * Checks if the given local scheduler satisfies the task's hard constraints. - * - * @param scheduler Local scheduler. - * @param spec Task specification. - * @return True if all tasks's resource constraints are satisfied. False - * otherwise. - */ -bool constraints_satisfied_hard(const LocalScheduler *scheduler, - const TaskSpec *spec) { - if (scheduler->info.static_resources.count("CPU") == 1 && - scheduler->info.static_resources.at("CPU") == 0) { - // Don't give tasks to local schedulers that have 0 CPUs. This can be an - // issue for actor creation tasks that require 0 CPUs (but the subsequent - // actor methods require some CPUs). - return false; - } - - for (auto const &resource_pair : TaskSpec_get_required_resources(spec)) { - std::string resource_name = resource_pair.first; - double resource_quantity = resource_pair.second; - - // Continue on if the task doesn't actually require this resource. - if (resource_quantity == 0) { - continue; - } - - // Check if the local scheduler has this resource. - if (scheduler->info.static_resources.count(resource_name) == 0) { - return false; - } - - // Check if the local scheduler has enough of the resource. - if (scheduler->info.static_resources.at(resource_name) < - resource_quantity) { - return false; - } - } - return true; -} - -int64_t locally_available_data_size(const GlobalSchedulerState *state, - DBClientID local_scheduler_id, - TaskSpec *task_spec) { - /* This function will compute the total size of all the object dependencies - * for the given task that are already locally available to the specified - * local scheduler. */ - int64_t task_data_size = 0; - - RAY_CHECK(state->local_scheduler_plasma_map.count(local_scheduler_id) == 1); - - const std::string &plasma_manager = - state->local_scheduler_plasma_map.at(local_scheduler_id); - - /* TODO(rkn): Note that if the same object ID appears as multiple arguments, - * then it will be overcounted. 
*/ - for (int64_t i = 0; i < TaskSpec_num_args(task_spec); ++i) { - int count = TaskSpec_arg_id_count(task_spec, i); - for (int j = 0; j < count; ++j) { - ObjectID object_id = TaskSpec_arg_id(task_spec, i, j); - - if (state->scheduler_object_info_table.count(object_id) == 0) { - /* If this global scheduler is not aware of this object ID, then ignore - * it. */ - continue; - } - - const SchedulerObjectInfo &object_size_info = - state->scheduler_object_info_table.at(object_id); - - if (std::find(object_size_info.object_locations.begin(), - object_size_info.object_locations.end(), plasma_manager) == - object_size_info.object_locations.end()) { - /* This local scheduler does not have access to this object, so don't - * count this object. */ - continue; - } - - /* Look at the size of the object. */ - int64_t object_size = object_size_info.data_size; - if (object_size == -1) { - /* This means that this global scheduler does not know the object size - * yet, so assume that the object is one megabyte. TODO(rkn): Maybe we - * should instead use the average object size. */ - object_size = 1000000; - } - - /* If we get here, then this local scheduler has access to this object, so - * count the contribution of this object. */ - task_data_size += object_size; - } - } - - return task_data_size; -} - -double calculate_cost_pending(const GlobalSchedulerState *state, - const LocalScheduler *scheduler, - TaskSpec *task_spec) { - /* Calculate how much data is already present on this machine. TODO(rkn): Note - * that this information is not being used yet. Fix this. */ - locally_available_data_size(state, scheduler->id, task_spec); - /* TODO(rkn): This logic does not load balance properly when the different - * machines have different sizes. Fix this. */ - double cost_pending = scheduler->num_recent_tasks_sent + - scheduler->info.task_queue_length - - scheduler->info.available_workers; - return cost_pending; -} - -bool handle_task_waiting_random(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - Task *task) { - TaskSpec *task_spec = Task_task_execution_spec(task)->Spec(); - RAY_CHECK(task_spec != NULL) - << "task wait handler encounted a task with NULL spec"; - - std::vector feasible_nodes; - - for (const auto &it : state->local_schedulers) { - // Local scheduler map iterator yields pairs. - const LocalScheduler &local_scheduler = it.second; - if (!constraints_satisfied_hard(&local_scheduler, task_spec)) { - continue; - } - // Add this local scheduler as a candidate for random selection. - feasible_nodes.push_back(it.first); - } - - if (feasible_nodes.size() == 0) { - RAY_LOG(ERROR) << "Infeasible task. No nodes satisfy hard constraints for " - << "task = " << Task_task_id(task); - return false; - } - - // Randomly select the local scheduler. TODO(atumanov): replace with - // std::discrete_distribution. - std::uniform_int_distribution<> dis(0, feasible_nodes.size() - 1); - DBClientID local_scheduler_id = - feasible_nodes[dis(policy_state->getRandomGenerator())]; - RAY_CHECK(!local_scheduler_id.is_nil()) - << "Task is feasible, but doesn't have a local scheduler assigned."; - // A local scheduler ID was found, so assign the task. 
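The random policy deleted in this hunk filters local schedulers by their hard resource constraints and then draws one of the feasible candidates uniformly with the policy's std::mt19937_64. A minimal standalone sketch of that idea follows; NodeInfo, SatisfiesHardConstraints, and PickRandomFeasibleNode are illustrative names, not part of the removed code.

#include <cstdint>
#include <iostream>
#include <optional>
#include <random>
#include <string>
#include <unordered_map>
#include <vector>

// Simplified stand-in for the deleted LocalScheduler / TaskSpec structures.
struct NodeInfo {
  std::string id;
  std::unordered_map<std::string, double> static_resources;
};

// Hard-constraint check: every nonzero resource the task requests must be
// present on the node in at least the requested quantity.
bool SatisfiesHardConstraints(
    const NodeInfo &node,
    const std::unordered_map<std::string, double> &required) {
  for (const auto &[name, quantity] : required) {
    if (quantity == 0) {
      continue;
    }
    auto it = node.static_resources.find(name);
    if (it == node.static_resources.end() || it->second < quantity) {
      return false;
    }
  }
  return true;
}

// Collect the feasible nodes and pick one uniformly at random, or return
// nullopt if the task is infeasible everywhere.
std::optional<std::string> PickRandomFeasibleNode(
    const std::vector<NodeInfo> &nodes,
    const std::unordered_map<std::string, double> &required,
    std::mt19937_64 &gen) {
  std::vector<const NodeInfo *> feasible;
  for (const auto &node : nodes) {
    if (SatisfiesHardConstraints(node, required)) {
      feasible.push_back(&node);
    }
  }
  if (feasible.empty()) {
    return std::nullopt;
  }
  std::uniform_int_distribution<size_t> dis(0, feasible.size() - 1);
  return feasible[dis(gen)]->id;
}

int main() {
  std::mt19937_64 gen(42);
  std::vector<NodeInfo> nodes = {{"node-a", {{"CPU", 4}}},
                                 {"node-b", {{"CPU", 8}, {"GPU", 1}}}};
  auto chosen = PickRandomFeasibleNode(nodes, {{"CPU", 1}, {"GPU", 1}}, gen);
  std::cout << (chosen ? *chosen : std::string("infeasible")) << std::endl;
}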
- assign_task_to_local_scheduler(state, task, local_scheduler_id); - return true; -} - -bool handle_task_waiting_cost(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - Task *task) { - TaskSpec *task_spec = Task_task_execution_spec(task)->Spec(); - int64_t curtime = current_time_ms(); - - RAY_CHECK(task_spec != NULL) - << "task wait handler encounted a task with NULL spec"; - - // For tasks already seen by the global scheduler (spillback > 1), - // adjust scheduled task counts for the source local scheduler. - if (task->execution_spec->SpillbackCount() > 1) { - auto it = state->local_schedulers.find(task->local_scheduler_id); - // Task's previous local scheduler must be present and known. - RAY_CHECK(it != state->local_schedulers.end()); - LocalScheduler &src_local_scheduler = it->second; - src_local_scheduler.num_recent_tasks_sent -= 1; - } - - bool task_feasible = false; - - // Go through all the nodes, calculate the score for each, pick max score. - double best_local_scheduler_score = INT32_MIN; - RAY_CHECK(best_local_scheduler_score < 0) - << "We might have a floating point underflow"; - RAY_LOG(INFO) << "ct[" << curtime << "] task from " - << task->local_scheduler_id << " spillback " - << task->execution_spec->SpillbackCount(); - - // The best node to send this task. - DBClientID best_local_scheduler_id = DBClientID::nil(); - - for (auto it = state->local_schedulers.begin(); - it != state->local_schedulers.end(); it++) { - // For each local scheduler, calculate its score. Check hard constraints - // first. - LocalScheduler *scheduler = &(it->second); - if (!constraints_satisfied_hard(scheduler, task_spec)) { - continue; - } - // Skip the local scheduler the task came from. - if (task->local_scheduler_id == scheduler->id) { - continue; - } - task_feasible = true; - // This node satisfies the hard capacity constraint. Calculate its score. - double score = -1 * calculate_cost_pending(state, scheduler, task_spec); - RAY_LOG(INFO) << "ct[" << curtime << "][" << scheduler->id << "][q" - << scheduler->info.task_queue_length << "][w" - << scheduler->info.available_workers << "]: score " << score - << " bestscore " << best_local_scheduler_score; - if (score >= best_local_scheduler_score) { - best_local_scheduler_score = score; - best_local_scheduler_id = scheduler->id; - } - } - - if (!task_feasible) { - RAY_LOG(ERROR) << "Infeasible task. No nodes satisfy hard constraints for " - << "task = " << Task_task_id(task); - // TODO(atumanov): propagate this error to the task's driver and/or - // cache the task in case new local schedulers satisfy it in the future. - return false; - } - RAY_CHECK(!best_local_scheduler_id.is_nil()) - << "Task is feasible, but doesn't have a local scheduler assigned."; - // A local scheduler ID was found, so assign the task. - assign_task_to_local_scheduler(state, task, best_local_scheduler_id); - return true; -} - -bool handle_task_waiting(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - Task *task) { - return handle_task_waiting_random(state, policy_state, task); -} - -void handle_object_available(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - ObjectID object_id) { - /* Do nothing for now. */ -} - -void handle_new_local_scheduler(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - DBClientID db_client_id) { - /* Do nothing for now. 
*/ -} - -void handle_local_scheduler_removed(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - DBClientID db_client_id) { - /* Do nothing for now. */ -} diff --git a/src/global_scheduler/global_scheduler_algorithm.h b/src/global_scheduler/global_scheduler_algorithm.h deleted file mode 100644 index 69be67d97477d..0000000000000 --- a/src/global_scheduler/global_scheduler_algorithm.h +++ /dev/null @@ -1,126 +0,0 @@ -#ifndef GLOBAL_SCHEDULER_ALGORITHM_H -#define GLOBAL_SCHEDULER_ALGORITHM_H - -#include -#include - -#include "common.h" -#include "global_scheduler.h" -#include "task.h" - -/* ==== The scheduling algorithm ==== - * - * This file contains declaration for all functions and data structures that - * need to be provided if you want to implement a new algorithm for the global - * scheduler. - * - */ - -enum class GlobalSchedulerAlgorithm { - SCHED_ALGORITHM_ROUND_ROBIN = 1, - SCHED_ALGORITHM_TRANSFER_AWARE = 2, - SCHED_ALGORITHM_MAX -}; - -/// The class encapsulating state managed by the global scheduling policy. -class GlobalSchedulerPolicyState { - public: - GlobalSchedulerPolicyState(int64_t round_robin_index) - : round_robin_index_(round_robin_index), - gen_(std::chrono::high_resolution_clock::now() - .time_since_epoch() - .count()) {} - - GlobalSchedulerPolicyState() - : round_robin_index_(0), - gen_(std::chrono::high_resolution_clock::now() - .time_since_epoch() - .count()) {} - - /// Return the policy's random number generator. - /// - /// @return The policy's random number generator. - std::mt19937_64 &getRandomGenerator() { return gen_; } - - /// Return the round robin index maintained by policy state. - /// - /// @return The round robin index. - int64_t getRoundRobinIndex() const { return round_robin_index_; } - - private: - /// The index of the next local scheduler to assign a task to. - int64_t round_robin_index_; - /// Internally maintained random number generator. - std::mt19937_64 gen_; -}; - -/** - * Create the state of the global scheduler policy. This state must be freed by - * the caller. - * - * @return The state of the scheduling policy. - */ -GlobalSchedulerPolicyState *GlobalSchedulerPolicyState_init(void); - -/** - * Free the global scheduler policy state. - * - * @param policy_state The policy state to free. - * @return Void. - */ -void GlobalSchedulerPolicyState_free(GlobalSchedulerPolicyState *policy_state); - -/** - * Main new task handling function in the global scheduler. - * - * @param state Global scheduler state. - * @param policy_state State specific to the scheduling policy. - * @param task New task to be scheduled. - * @return True if the task was assigned to a local scheduler and false - * otherwise. - */ -bool handle_task_waiting(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - Task *task); - -/** - * Handle the fact that a new object is available. - * - * @param state The global scheduler state. - * @param policy_state The state managed by the scheduling policy. - * @param object_id The ID of the object that is now available. - * @return Void. - */ -void handle_object_available(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - ObjectID object_id); - -/** - * Handle a heartbeat message from a local scheduler. TODO(rkn): this is a - * placeholder for now. - * - * @param state The global scheduler state. - * @param policy_state The state managed by the scheduling policy. - * @return Void. 
- */ -void handle_local_scheduler_heartbeat(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state); - -/** - * Handle the presence of a new local scheduler. Currently, this just adds the - * local scheduler to a queue of local schedulers. - * - * @param state The global scheduler state. - * @param policy_state The state managed by the scheduling policy. - * @param The db client ID of the new local scheduler. - * @return Void. - */ -void handle_new_local_scheduler(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - DBClientID db_client_id); - -void handle_local_scheduler_removed(GlobalSchedulerState *state, - GlobalSchedulerPolicyState *policy_state, - DBClientID db_client_id); - -#endif /* GLOBAL_SCHEDULER_ALGORITHM_H */ diff --git a/src/local_scheduler/CMakeLists.txt b/src/local_scheduler/CMakeLists.txt deleted file mode 100644 index 7033c4f2306cf..0000000000000 --- a/src/local_scheduler/CMakeLists.txt +++ /dev/null @@ -1,104 +0,0 @@ -cmake_minimum_required(VERSION 3.4) - -project(local_scheduler) - -add_definitions(-fPIC) - -if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") - include_directories("${PYTHON_INCLUDE_DIRS}") - include_directories("${NUMPY_INCLUDE_DIR}") -endif() - -set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Werror -Wall") - -if(UNIX AND NOT APPLE) - link_libraries(rt) -endif() - -include_directories("${CMAKE_CURRENT_LIST_DIR}/") -include_directories("${CMAKE_CURRENT_LIST_DIR}/../") -# TODO(pcm): get rid of this: -if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") - include_directories("${CMAKE_CURRENT_LIST_DIR}/../plasma/") -endif() - -include_directories("${ARROW_INCLUDE_DIR}") -include_directories("${CMAKE_CURRENT_LIST_DIR}/../common/format/") - -# Compile flatbuffers - -set(LOCAL_SCHEDULER_FBS_SRC "${CMAKE_CURRENT_LIST_DIR}/format/local_scheduler.fbs") -set(OUTPUT_DIR ${CMAKE_CURRENT_LIST_DIR}/format/) - -set(LOCAL_SCHEDULER_FBS_OUTPUT_FILES - "${OUTPUT_DIR}/local_scheduler_generated.h") - -add_custom_command( - OUTPUT ${LOCAL_SCHEDULER_FBS_OUTPUT_FILES} - COMMAND ${FLATBUFFERS_COMPILER} -c -o ${OUTPUT_DIR} ${LOCAL_SCHEDULER_FBS_SRC} --gen-object-api --scoped-enums - DEPENDS ${FBS_DEPENDS} - COMMENT "Running flatc compiler on ${LOCAL_SCHEDULER_FBS_SRC}" - VERBATIM) - -add_custom_target(gen_local_scheduler_fbs DEPENDS ${LOCAL_SCHEDULER_FBS_OUTPUT_FILES}) - -add_dependencies(gen_local_scheduler_fbs arrow) - -add_library(local_scheduler_client STATIC local_scheduler_client.cc) - -# local_scheduler_shared.h includes ray/gcs/client.h which requires gen_gcs_fbs & gen_node_manager_fbs. 
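For the SCHED_ALGORITHM_TRANSFER_AWARE path declared above, the deleted handle_task_waiting_cost scores each feasible node by negating (recently sent tasks + queued tasks - available workers) and keeps the maximum. A compact sketch of that scoring loop under simplified assumptions; NodeLoad, Score, and PickBestNode are illustrative names.

#include <cstdint>
#include <limits>
#include <optional>
#include <string>
#include <vector>

// Per-node load snapshot, mirroring the heartbeat fields the deleted policy
// reads from each local scheduler (the field names here are illustrative).
struct NodeLoad {
  std::string id;
  int64_t recent_tasks_sent;  // tasks pushed to the node since its last heartbeat
  int64_t task_queue_length;  // tasks already queued on the node
  int64_t available_workers;  // idle workers reported by the node
};

// The deleted policy computes a pending-work cost and negates it, so the node
// with the least backlog (and most idle workers) gets the highest score.
double Score(const NodeLoad &n) {
  double cost_pending = static_cast<double>(
      n.recent_tasks_sent + n.task_queue_length - n.available_workers);
  return -cost_pending;
}

// Return the id of the best-scoring node, or nullopt if there are none.
std::optional<std::string> PickBestNode(const std::vector<NodeLoad> &nodes) {
  double best_score = std::numeric_limits<double>::lowest();
  std::optional<std::string> best_id;
  for (const auto &n : nodes) {
    double score = Score(n);
    if (score >= best_score) {
      best_score = score;
      best_id = n.id;
    }
  }
  return best_id;
}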
-add_dependencies(local_scheduler_client common hiredis gen_local_scheduler_fbs ${COMMON_FBS_OUTPUT_FILES} gen_gcs_fbs gen_node_manager_fbs) - -add_executable(local_scheduler local_scheduler.cc local_scheduler_algorithm.cc) -add_dependencies(local_scheduler hiredis) -target_link_libraries(local_scheduler local_scheduler_client common ${HIREDIS_LIB} ${PLASMA_STATIC_LIB} ray_static ${ARROW_STATIC_LIB} -lpthread ${Boost_SYSTEM_LIBRARY}) - -add_executable(local_scheduler_tests test/local_scheduler_tests.cc local_scheduler.cc local_scheduler_algorithm.cc) -add_dependencies(local_scheduler_tests hiredis) -target_link_libraries(local_scheduler_tests local_scheduler_client common ${HIREDIS_LIB} ${PLASMA_STATIC_LIB} ray_static ${ARROW_STATIC_LIB} -lpthread ${Boost_SYSTEM_LIBRARY}) -target_compile_options(local_scheduler_tests PUBLIC "-DLOCAL_SCHEDULER_TEST") - -macro(get_local_scheduler_library LANG VAR) - set(${VAR} "local_scheduler_library_${LANG}") -endmacro() - -macro(set_local_scheduler_library LANG) - get_local_scheduler_library(${LANG} LOCAL_SCHEDULER_LIBRARY_${LANG}) - set(LOCAL_SCHEDULER_LIBRARY_LANG ${LOCAL_SCHEDULER_LIBRARY_${LANG}}) - include_directories("${CMAKE_CURRENT_LIST_DIR}/../common/lib/${LANG}/") - - file(GLOB LOCAL_SCHEDULER_LIBRARY_${LANG}_SRC - lib/${LANG}/*.cc - ${CMAKE_CURRENT_LIST_DIR}/../common/lib/${LANG}/*.cc) - add_library(${LOCAL_SCHEDULER_LIBRARY_LANG} SHARED - ${LOCAL_SCHEDULER_LIBRARY_${LANG}_SRC}) - - if(APPLE) - if ("${LANG}" STREQUAL "python") - SET_TARGET_PROPERTIES(${LOCAL_SCHEDULER_LIBRARY_LANG} PROPERTIES SUFFIX .so) - endif() - target_link_libraries(${LOCAL_SCHEDULER_LIBRARY_LANG} "-undefined dynamic_lookup" local_scheduler_client common ray_static ${PLASMA_STATIC_LIB} ${ARROW_STATIC_LIB} ${Boost_SYSTEM_LIBRARY}) - else(APPLE) - target_link_libraries(${LOCAL_SCHEDULER_LIBRARY_LANG} local_scheduler_client common ray_static ${PLASMA_STATIC_LIB} ${ARROW_STATIC_LIB} ${Boost_SYSTEM_LIBRARY}) - endif(APPLE) - - add_dependencies(${LOCAL_SCHEDULER_LIBRARY_LANG} gen_local_scheduler_fbs) - - install(TARGETS ${LOCAL_SCHEDULER_LIBRARY_LANG} DESTINATION ${CMAKE_SOURCE_DIR}/local_scheduler) -endmacro() - -if ("${CMAKE_RAY_LANG_PYTHON}" STREQUAL "YES") - set_local_scheduler_library("python") -endif() - -if ("${CMAKE_RAY_LANG_JAVA}" STREQUAL "YES") - add_compile_options("-I$ENV{JAVA_HOME}/include/") - if(WIN32) - add_compile_options("-I$ENV{JAVA_HOME}/include/win32") - elseif(APPLE) - add_compile_options("-I$ENV{JAVA_HOME}/include/darwin") - else() # linux - add_compile_options("-I$ENV{JAVA_HOME}/include/linux") - endif() - set_local_scheduler_library("java") -endif() diff --git a/src/local_scheduler/build/.gitkeep b/src/local_scheduler/build/.gitkeep deleted file mode 100644 index e69de29bb2d1d..0000000000000 diff --git a/src/local_scheduler/format/local_scheduler.fbs b/src/local_scheduler/format/local_scheduler.fbs deleted file mode 100644 index ffdf13d6aea41..0000000000000 --- a/src/local_scheduler/format/local_scheduler.fbs +++ /dev/null @@ -1,127 +0,0 @@ -// Local scheduler protocol specification -namespace ray.local_scheduler.protocol; - -enum MessageType:int { - // Task is submitted to the local scheduler. This is sent from a worker to a - // local scheduler. - SubmitTask = 1, - // Notify the local scheduler that a task has finished. This is sent from a - // worker to a local scheduler. - TaskDone, - // Log a message to the event table. This is sent from a worker to a local - // scheduler. 
- EventLogMessage, - // Send an initial connection message to the local scheduler. This is sent - // from a worker or driver to a local scheduler. - RegisterClientRequest, - // Send a reply confirming the successful registration of a worker or driver. - // This is sent from the local scheduler to a worker or driver. - RegisterClientReply, - // Notify the local scheduler that this client is disconnecting gracefully. - // This is sent from a worker to a local scheduler. - DisconnectClient, - // Get a new task from the local scheduler. This is sent from a worker to a - // local scheduler. - GetTask, - // Tell a worker to execute a task. This is sent from a local scheduler to a - // worker. - ExecuteTask, - // Reconstruct or fetch possibly lost objects. This is sent from a worker to - // a local scheduler. - ReconstructObjects, - // For a worker that was blocked on some object(s), tell the local scheduler - // that the worker is now unblocked. This is sent from a worker to a local - // scheduler. - NotifyUnblocked, - // Add a result table entry for an object put. - PutObject, - // A request to get the task frontier for an actor, called by the actor when - // saving a checkpoint. - GetActorFrontierRequest, - // The ActorFrontier response to a GetActorFrontierRequest. The local - // scheduler returns the actor's per-handle task counts and execution - // dependencies, which can later be used as the argument to SetActorFrontier - // when resuming from the checkpoint. - GetActorFrontierReply, - // A request to set the task frontier for an actor, called when resuming from - // a checkpoint. The local scheduler will update the actor's per-handle task - // counts and execution dependencies, discard any tasks that already executed - // before the checkpoint, and make any tasks on the frontier runnable by - // making their execution dependencies available. - SetActorFrontier -} - -table SubmitTaskRequest { - execution_dependencies: [string]; - task_spec: string; -} - -// This message is sent from the local scheduler to a worker. -table GetTaskReply { - // A string of bytes representing the task specification. - task_spec: string; - // The IDs of the GPUs that the worker is allowed to use for this task. - gpu_ids: [int]; -} - -table EventLogMessage { - key: string; - value: string; - timestamp: double; -} - -// This struct is used to register a new worker with the local scheduler. -// It is shipped as part of local_scheduler_connect. -table RegisterClientRequest { - // True if the client is a worker and false if the client is a driver. - is_worker: bool; - // The ID of the worker or driver. - client_id: string; - // The process ID of this worker. - worker_pid: long; - // The driver ID. This is non-nil if the client is a driver. - driver_id: string; -} - -table DisconnectClient { -} - -table ReconstructObjects { - // List of object IDs of the objects that we want to reconstruct or fetch. - object_ids: [string]; - // Do we only want to fetch the objects or also reconstruct them? - fetch_only: bool; -} - -table PutObject { - // Task ID of the task that performed the put. - task_id: string; - // Object ID of the object that is being put. - object_id: string; -} - -// The ActorFrontier is used to represent the current frontier of tasks that -// the local scheduler has marked as runnable for a particular actor. 
It is -// used to save the point in an actor's lifetime at which a checkpoint was -// taken, so that the same frontier of tasks can be made runnable again if the -// actor is resumed from that checkpoint. -table ActorFrontier { - // Actor ID of the actor whose frontier is described. - actor_id: string; - // A list of handle IDs, representing the callers of the actor that have - // submitted a runnable task to the local scheduler. A nil ID represents the - // creator of the actor. - handle_ids: [string]; - // A list representing the number of tasks executed so far, per handle. Each - // count in task_counters corresponds to the handle at the same in index in - // handle_ids. - task_counters: [long]; - // A list representing the execution dependency for the next runnable task, - // per handle. Each execution dependency in frontier_dependencies corresponds - // to the handle at the same in index in handle_ids. - frontier_dependencies: [string]; -} - -table GetActorFrontierRequest { - actor_id: string; -} diff --git a/src/local_scheduler/lib/java/org_ray_runtime_raylet_RayletClientImpl.h b/src/local_scheduler/lib/java/org_ray_runtime_raylet_RayletClientImpl.h deleted file mode 100644 index b730b00643d54..0000000000000 --- a/src/local_scheduler/lib/java/org_ray_runtime_raylet_RayletClientImpl.h +++ /dev/null @@ -1,134 +0,0 @@ -/* DO NOT EDIT THIS FILE - it is machine generated */ -#include -/* Header for class org_ray_runtime_raylet_RayletClientImpl */ - -#ifndef _Included_org_ray_runtime_raylet_RayletClientImpl -#define _Included_org_ray_runtime_raylet_RayletClientImpl -#ifdef __cplusplus -extern "C" { -#endif -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeInit - * Signature: (Ljava/lang/String;[BZ[B)J - */ -JNIEXPORT jlong JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeInit(JNIEnv *, - jclass, - jstring, - jbyteArray, - jboolean, - jbyteArray); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeSubmitTask - * Signature: (J[BLjava/nio/ByteBuffer;II)V - */ -JNIEXPORT void JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeSubmitTask(JNIEnv *, - jclass, - jlong, - jbyteArray, - jobject, - jint, - jint); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeGetTask - * Signature: (J)[B - */ -JNIEXPORT jbyteArray JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeGetTask(JNIEnv *, - jclass, - jlong); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeDestroy - * Signature: (J)V - */ -JNIEXPORT void JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeDestroy(JNIEnv *, - jclass, - jlong); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeReconstructObjects - * Signature: (J[[BZ)V - */ -JNIEXPORT void JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeReconstructObjects( - JNIEnv *, - jclass, - jlong, - jobjectArray, - jboolean); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeNotifyUnblocked - * Signature: (J)V - */ -JNIEXPORT void JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeNotifyUnblocked(JNIEnv *, - jclass, - jlong); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativePutObject - * Signature: (J[B[B)V - */ -JNIEXPORT void JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativePutObject(JNIEnv *, - jclass, - jlong, - jbyteArray, - jbyteArray); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeWaitObject - * Signature: (J[[BIIZ)[Z - */ 
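The ActorFrontier table above records, per caller handle, how many tasks have executed and the execution dependency that gates the next runnable task, so a checkpointed actor can be resumed at exactly the same point. A conceptual sketch of that bookkeeping follows; plain std::string keys stand in for the binary handle and object IDs, and Frontier/Advance are illustrative names rather than the generated flatbuffer API.

#include <cstdint>
#include <string>
#include <unordered_map>

// Conceptual model of the frontier described above: for each caller handle,
// how many tasks have run and which execution dependency gates the next one.
struct Frontier {
  std::unordered_map<std::string, int64_t> task_counters;
  std::unordered_map<std::string, std::string> frontier_dependencies;
};

// Record that one more task submitted through `handle` has become runnable,
// producing `execution_dep` as the dependency for that handle's next task.
void Advance(Frontier &frontier, const std::string &handle,
             const std::string &execution_dep) {
  frontier.task_counters[handle] += 1;
  frontier.frontier_dependencies[handle] = execution_dep;
}

// Saving `frontier` next to a checkpoint and restoring it on resume lets the
// scheduler discard tasks that already executed and re-enable the rest.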
-JNIEXPORT jbooleanArray JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeWaitObject(JNIEnv *, - jclass, - jlong, - jobjectArray, - jint, - jint, - jboolean); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeGenerateTaskId - * Signature: ([B[BI)[B - */ -JNIEXPORT jbyteArray JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeGenerateTaskId(JNIEnv *, - jclass, - jbyteArray, - jbyteArray, - jint); - -/* - * Class: org_ray_runtime_raylet_RayletClientImpl - * Method: nativeFreePlasmaObjects - * Signature: (J[[BZ)V - */ -JNIEXPORT void JNICALL -Java_org_ray_runtime_raylet_RayletClientImpl_nativeFreePlasmaObjects( - JNIEnv *, - jclass, - jlong, - jobjectArray, - jboolean); - -#ifdef __cplusplus -} -#endif -#endif diff --git a/src/local_scheduler/local_scheduler.cc b/src/local_scheduler/local_scheduler.cc deleted file mode 100644 index 7bef00993ab9b..0000000000000 --- a/src/local_scheduler/local_scheduler.cc +++ /dev/null @@ -1,1555 +0,0 @@ -#include - -#include -#include -#include -#include -#include -#include -#include - -#include - -#include "common.h" -#include "common_protocol.h" -#include "event_loop.h" -#include "format/local_scheduler_generated.h" -#include "io.h" -#include "local_scheduler.h" -#include "local_scheduler_algorithm.h" -#include "local_scheduler_shared.h" -#include "logging.h" -#include "net.h" -#include "ray/util/util.h" -#include "state/actor_notification_table.h" -#include "state/db.h" -#include "state/db_client_table.h" -#include "state/driver_table.h" -#include "state/error_table.h" -#include "state/object_table.h" -#include "state/task_table.h" - -using MessageType = ray::local_scheduler::protocol::MessageType; - -/** - * A helper function for printing available and requested resource information. - * - * @param state Local scheduler state. - * @param spec Task specification object. - * @return Void. - */ -void print_resource_info(const LocalSchedulerState *state, - const TaskSpec *spec) { -#if RAY_COMMON_LOG_LEVEL <= RAY_COMMON_DEBUG - // Print information about available and requested resources. - std::cout << "Static Resources: " << std::endl; - for (auto const &resource_pair : state->static_resources) { - std::cout << " " << resource_pair.first << ": " << resource_pair.second - << std::endl; - } - std::cout << "Dynamic Resources: " << std::endl; - for (auto const &resource_pair : state->dynamic_resources) { - std::cout << " " << resource_pair.first << ": " << resource_pair.second - << std::endl; - } - if (spec) { - std::cout << "Task Required Resources: " << std::endl; - for (auto const &resource_pair : TaskSpec_get_required_resources(spec)) { - std::cout << " " << resource_pair.first << ": " << resource_pair.second - << std::endl; - } - } -#endif -} - -int force_kill_worker(event_loop *loop, timer_id id, void *context) { - LocalSchedulerClient *worker = (LocalSchedulerClient *) context; - kill(worker->pid, SIGKILL); - close(worker->sock); - delete worker; - return EVENT_LOOP_TIMER_DONE; -} - -void kill_worker(LocalSchedulerState *state, - LocalSchedulerClient *worker, - bool cleanup, - bool suppress_warning) { - /* Erase the local scheduler's reference to the worker. */ - auto it = std::find(state->workers.begin(), state->workers.end(), worker); - RAY_CHECK(it != state->workers.end()); - state->workers.erase(it); - - /* Make sure that we removed the worker. */ - it = std::find(state->workers.begin(), state->workers.end(), worker); - RAY_CHECK(it == state->workers.end()); - - /* Release any resources held by the worker. 
It's important to do this before - * calling handle_worker_removed and handle_actor_worker_disconnect because - * freeing up resources here will allow the scheduling algorithm to dispatch - * more tasks. */ - release_resources(state, worker, worker->resources_in_use); - - /* Erase the algorithm state's reference to the worker. */ - if (worker->actor_id.is_nil()) { - handle_worker_removed(state, state->algorithm_state, worker); - } else { - /* Let the scheduling algorithm process the absence of this worker. */ - handle_actor_worker_disconnect(state, state->algorithm_state, worker, - cleanup); - } - - /* Remove the client socket from the event loop so that we don't process the - * SIGPIPE when the worker is killed. */ - event_loop_remove_file(state->loop, worker->sock); - - /* If the worker has registered a process ID with us and it's a child - * process, use it to send a kill signal. */ - bool free_worker = true; - if (worker->is_child && worker->pid != 0) { - /* If worker is a driver, we should not enter this condition because - * worker->pid should be 0. */ - if (cleanup) { - /* If we're exiting the local scheduler anyway, it's okay to force kill - * the worker immediately. Wait for the process to exit. */ - kill(worker->pid, SIGKILL); - waitpid(worker->pid, NULL, 0); - close(worker->sock); - } else { - /* If we're just cleaning up a single worker, allow it some time to clean - * up its state before force killing. The client socket will be closed - * and the worker struct will be freed after the timeout. */ - kill(worker->pid, SIGTERM); - event_loop_add_timer( - state->loop, RayConfig::instance().kill_worker_timeout_milliseconds(), - force_kill_worker, (void *) worker); - free_worker = false; - } - RAY_LOG(DEBUG) << "Killed worker with pid " << worker->pid; - } - - /* If this worker is still running a task and we aren't cleaning up, push an - * error message to the driver responsible for the task. */ - if (worker->task_in_progress != NULL && !cleanup && !suppress_warning) { - TaskSpec *spec = Task_task_execution_spec(worker->task_in_progress)->Spec(); - - std::ostringstream error_message; - error_message << "The worker with ID " << worker->client_id << " died or " - << "was killed while executing the task with ID " - << TaskSpec_task_id(spec); - push_error(state->db, TaskSpec_driver_id(spec), ErrorIndex::WORKER_DIED, - error_message.str()); - } - - /* Clean up the task in progress. */ - if (worker->task_in_progress) { - /* Update the task table to reflect that the task failed to complete. */ - if (state->db != NULL) { - Task_set_state(worker->task_in_progress, TaskStatus::LOST); - task_table_update(state->db, worker->task_in_progress, NULL, NULL, NULL); - } else { - Task_free(worker->task_in_progress); - } - } - - RAY_LOG(DEBUG) << "Killed worker with pid " << worker->pid; - if (free_worker) { - /* Clean up the client socket after killing the worker so that the worker - * can't receive the SIGPIPE before exiting. */ - close(worker->sock); - delete worker; - } -} - -void LocalSchedulerState_free(LocalSchedulerState *state) { - /* Reset the SIGTERM handler to default behavior, so we try to clean up the - * local scheduler at most once. If a SIGTERM is caught afterwards, there is - * the possibility of orphan worker processes. */ - signal(SIGTERM, SIG_DFL); - /* Send a null heartbeat that tells the global scheduler that we are dead to - * avoid waiting for the heartbeat timeout. 
*/ - if (state->db != NULL) { - local_scheduler_table_disconnect(state->db); - } - - /* Kill any child processes that didn't register as a worker yet. */ - for (auto const &worker_pid : state->child_pids) { - kill(worker_pid, SIGKILL); - waitpid(worker_pid, NULL, 0); - RAY_LOG(INFO) << "Killed worker pid " << worker_pid - << " which hadn't started yet."; - } - - /* Kill any registered workers. */ - /* TODO(swang): It's possible that the local scheduler will exit before all - * of its task table updates make it to redis. */ - while (state->workers.size() > 0) { - /* Note that kill_worker modifies the container state->workers, so it is - * important to do this loop in a way that does not use invalidated - * iterators. */ - kill_worker(state, state->workers.back(), true, false); - } - - /* Disconnect from plasma. */ - ARROW_CHECK_OK(state->plasma_conn->Disconnect()); - delete state->plasma_conn; - state->plasma_conn = NULL; - - /* Clean up the database connection. NOTE(swang): The global scheduler is - * responsible for deleting our entry from the db_client table, so do not - * delete it here. */ - if (state->db != NULL) { - DBHandle_free(state->db); - } - - /* Free the command for starting new workers. */ - if (state->config.start_worker_command != NULL) { - int i = 0; - const char *arg = state->config.start_worker_command[i]; - while (arg != NULL) { - free((void *) arg); - ++i; - arg = state->config.start_worker_command[i]; - } - free(state->config.start_worker_command); - state->config.start_worker_command = NULL; - } - - /* Free the algorithm state. */ - SchedulingAlgorithmState_free(state->algorithm_state); - state->algorithm_state = NULL; - - event_loop *loop = state->loop; - - /* Free the scheduler state. */ - delete state; - - /* Destroy the event loop. */ - destroy_outstanding_callbacks(loop); - event_loop_destroy(loop); -} - -void start_worker(LocalSchedulerState *state) { - /* We can't start a worker if we don't have the path to the worker script. */ - if (state->config.start_worker_command == NULL) { - RAY_LOG(DEBUG) << "No valid command to start worker provided. Cannot start " - << "worker."; - return; - } - /* Launch the process to create the worker. */ - pid_t pid = fork(); - if (pid != 0) { - state->child_pids.push_back(pid); - RAY_LOG(DEBUG) << "Started worker with pid " << pid; - return; - } - - /* Reset the SIGCHLD handler so that it doesn't influence the worker. */ - signal(SIGCHLD, SIG_DFL); - - std::vector command_vector; - for (int i = 0; state->config.start_worker_command[i] != NULL; i++) { - command_vector.push_back(state->config.start_worker_command[i]); - } - - /* Add a NULL pointer to the end. */ - command_vector.push_back(NULL); - - /* Try to execute the worker command. Exit if we're not successful. */ - execvp(command_vector[0], (char *const *) command_vector.data()); - - LocalSchedulerState_free(state); - RAY_LOG(FATAL) << "Failed to start worker"; -} - -/** - * Parse the command to start a worker. This takes in the command string, - * splits it into tokens on the space characters, and allocates an array of the - * tokens, terminated by a NULL pointer. - * - * @param command The command string to start a worker. - * @return A pointer to an array of strings, the tokens in the command string. - * The last element is a NULL pointer. - */ -const char **parse_command(const char *command) { - /* Count the number of tokens. 
*/ - char *command_copy = strdup(command); - const char *delimiter = " "; - char *token = NULL; - int num_args = 0; - token = strtok(command_copy, delimiter); - while (token != NULL) { - ++num_args; - token = strtok(NULL, delimiter); - } - free(command_copy); - - /* Allocate a NULL-terminated array for the tokens. */ - const char **command_args = - (const char **) malloc((num_args + 1) * sizeof(const char *)); - command_args[num_args] = NULL; - - /* Fill in the token array. */ - command_copy = strdup(command); - token = strtok(command_copy, delimiter); - int i = 0; - while (token != NULL) { - command_args[i] = strdup(token); - ++i; - token = strtok(NULL, delimiter); - } - free(command_copy); - - RAY_CHECK(num_args == i); - return command_args; -} - -LocalSchedulerState *LocalSchedulerState_init( - const char *node_ip_address, - event_loop *loop, - const char *redis_primary_addr, - int redis_primary_port, - const char *local_scheduler_socket_name, - const char *plasma_store_socket_name, - const char *plasma_manager_socket_name, - const char *plasma_manager_address, - bool global_scheduler_exists, - const std::unordered_map &static_resource_conf, - const char *start_worker_command, - int num_workers) { - LocalSchedulerState *state = new LocalSchedulerState(); - /* Set the configuration struct for the local scheduler. */ - if (start_worker_command != NULL) { - state->config.start_worker_command = parse_command(start_worker_command); - } else { - state->config.start_worker_command = NULL; - } - if (start_worker_command == NULL) { - RAY_LOG(WARNING) << "No valid command to start a worker provided, local " - << "scheduler will not start any workers."; - } - state->config.global_scheduler_exists = global_scheduler_exists; - - state->loop = loop; - - /* Connect to Redis if a Redis address is provided. */ - if (redis_primary_addr != NULL) { - /* Construct db_connect_args */ - std::vector db_connect_args; - db_connect_args.push_back("local_scheduler_socket_name"); - db_connect_args.push_back(local_scheduler_socket_name); - for (auto const &resource_pair : static_resource_conf) { - // TODO(rkn): This could cause issues if a resource name collides with - // another field name "manager_address". - db_connect_args.push_back(resource_pair.first); - db_connect_args.push_back(std::to_string(resource_pair.second)); - } - - if (plasma_manager_address != NULL) { - db_connect_args.push_back("manager_address"); - db_connect_args.push_back(plasma_manager_address); - } - - state->db = db_connect(std::string(redis_primary_addr), redis_primary_port, - "local_scheduler", node_ip_address, db_connect_args); - db_attach(state->db, loop, false); - } else { - state->db = NULL; - } - /* Connect to Plasma. This method will retry if Plasma hasn't started yet. */ - state->plasma_conn = new plasma::PlasmaClient(); - if (plasma_manager_socket_name != NULL) { - ARROW_CHECK_OK(state->plasma_conn->Connect( - plasma_store_socket_name, plasma_manager_socket_name, - plasma::kPlasmaDefaultReleaseDelay)); - } else { - ARROW_CHECK_OK(state->plasma_conn->Connect( - plasma_store_socket_name, "", plasma::kPlasmaDefaultReleaseDelay)); - } - /* Subscribe to notifications about sealed objects. */ - int plasma_fd; - ARROW_CHECK_OK(state->plasma_conn->Subscribe(&plasma_fd)); - /* Add the callback that processes the notification to the event loop. */ - event_loop_add_file(loop, plasma_fd, EVENT_LOOP_READ, - process_plasma_notification, state); - /* Add scheduler state. 
*/ - state->algorithm_state = SchedulingAlgorithmState_init(); - - /* Initialize resource vectors. */ - state->static_resources = static_resource_conf; - state->dynamic_resources = static_resource_conf; - /* Initialize available GPUs. */ - if (state->static_resources.count("GPU") == 1) { - for (int i = 0; i < state->static_resources["GPU"]; ++i) { - state->available_gpus.push_back(i); - } - } - /* Print some debug information about resource configuration. */ - print_resource_info(state, NULL); - - /* Start the initial set of workers. */ - for (int i = 0; i < num_workers; ++i) { - start_worker(state); - } - - /* Initialize the time at which the previous heartbeat was sent. */ - state->previous_heartbeat_time = current_time_ms(); - - return state; -} - -/* TODO(atumanov): vectorize resource counts on input. */ -bool check_dynamic_resources( - LocalSchedulerState *state, - const std::unordered_map &resources) { - for (auto const &resource_pair : resources) { - std::string resource_name = resource_pair.first; - double resource_quantity = resource_pair.second; - if (state->dynamic_resources[resource_name] < resource_quantity) { - return false; - } - } - return true; -} - -void resource_sanity_checks(LocalSchedulerState *state, - LocalSchedulerClient *worker) { - // Check the resources in use by the worker. - for (auto const &resource_pair : worker->resources_in_use) { - const std::string resource_name = resource_pair.first; - double resource_quantity = resource_pair.second; - - RAY_CHECK(state->dynamic_resources[resource_name] <= - state->static_resources[resource_name]); - if (resource_name != std::string("CPU")) { - RAY_CHECK(state->dynamic_resources[resource_name] >= 0); - } - - RAY_CHECK(resource_quantity >= 0); - RAY_CHECK(resource_quantity <= state->static_resources[resource_name]); - } -} - -/* TODO(atumanov): just pass the required resource vector of doubles. */ -void acquire_resources( - LocalSchedulerState *state, - LocalSchedulerClient *worker, - const std::unordered_map &resources) { - // Loop over each required resource type and acquire the appropriate quantity. - for (auto const &resource_pair : resources) { - const std::string resource_name = resource_pair.first; - double resource_quantity = resource_pair.second; - - // Do some special handling for GPU resources. - if (resource_name == std::string("GPU")) { - if (resource_quantity != 0) { - // Make sure that the worker isn't using any GPUs already. - RAY_CHECK(worker->gpus_in_use.size() == 0); - RAY_CHECK(state->available_gpus.size() >= resource_quantity); - // Reserve GPUs for the worker. - for (int i = 0; i < resource_quantity; i++) { - worker->gpus_in_use.push_back(state->available_gpus.back()); - state->available_gpus.pop_back(); - } - } - } - - // Do bookkeeping for general resource types. - if (resource_name != std::string("CPU")) { - RAY_CHECK(state->dynamic_resources[resource_name] >= resource_quantity); - } - state->dynamic_resources[resource_name] -= resource_quantity; - worker->resources_in_use[resource_name] += resource_quantity; - } - - // Do some sanity checks. - resource_sanity_checks(state, worker); -} - -void release_resources( - LocalSchedulerState *state, - LocalSchedulerClient *worker, - const std::unordered_map &resources) { - for (auto const &resource_pair : resources) { - const std::string resource_name = resource_pair.first; - double resource_quantity = resource_pair.second; - - // Do some special handling for GPU resources. 
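The acquire/release pair deleted here keeps two per-resource maps (total capacity and currently free quantity) plus a list of concrete GPU IDs that are lent to workers and returned on release. A simplified sketch of that bookkeeping, ignoring the special-case CPU accounting in the original; ResourcePool, WorkerSlot, Acquire, and Release are illustrative names.

#include <cassert>
#include <string>
#include <unordered_map>
#include <vector>

// A node tracks total capacity and currently free quantity per resource name,
// plus a pool of concrete GPU IDs that are handed to workers.
struct ResourcePool {
  std::unordered_map<std::string, double> static_resources;   // capacity
  std::unordered_map<std::string, double> dynamic_resources;  // currently free
  std::vector<int> available_gpus;                            // free GPU IDs
};

struct WorkerSlot {
  std::unordered_map<std::string, double> in_use;
  std::vector<int> gpus_in_use;
};

// Acquire: subtract from the free pool, record usage on the worker, and hand
// out concrete GPU IDs from the back of the free list.
void Acquire(ResourcePool &pool, WorkerSlot &worker,
             const std::unordered_map<std::string, double> &request) {
  for (const auto &[name, quantity] : request) {
    if (name == "GPU" && quantity > 0) {
      assert(pool.available_gpus.size() >= static_cast<size_t>(quantity));
      for (int i = 0; i < static_cast<int>(quantity); ++i) {
        worker.gpus_in_use.push_back(pool.available_gpus.back());
        pool.available_gpus.pop_back();
      }
    }
    pool.dynamic_resources[name] -= quantity;
    worker.in_use[name] += quantity;
  }
}

// Release: return GPU IDs to the pool and add the scalar quantities back.
void Release(ResourcePool &pool, WorkerSlot &worker) {
  for (int gpu : worker.gpus_in_use) {
    pool.available_gpus.push_back(gpu);
  }
  worker.gpus_in_use.clear();
  for (const auto &[name, quantity] : worker.in_use) {
    pool.dynamic_resources[name] += quantity;
  }
  worker.in_use.clear();
}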
- if (resource_name == std::string("GPU")) { - if (resource_quantity != 0) { - RAY_CHECK(resource_quantity == worker->gpus_in_use.size()); - // Move the GPU IDs the worker was using back to the local scheduler. - for (auto const &gpu_id : worker->gpus_in_use) { - state->available_gpus.push_back(gpu_id); - } - worker->gpus_in_use.clear(); - } - } - - // Do bookkeeping for general resources types. - state->dynamic_resources[resource_name] += resource_quantity; - worker->resources_in_use[resource_name] -= resource_quantity; - } - - // Do some sanity checks. - resource_sanity_checks(state, worker); -} - -bool is_driver_alive(LocalSchedulerState *state, WorkerID driver_id) { - return state->removed_drivers.count(driver_id) == 0; -} - -void assign_task_to_worker(LocalSchedulerState *state, - TaskExecutionSpec &execution_spec, - LocalSchedulerClient *worker) { - int64_t task_spec_size = execution_spec.SpecSize(); - TaskSpec *spec = execution_spec.Spec(); - // Acquire the necessary resources for running this task. - const std::unordered_map required_resources = - TaskSpec_get_required_resources(spec); - acquire_resources(state, worker, required_resources); - // Check that actor tasks don't have non-CPU requirements. Any necessary - // non-CPU resources (in particular, GPUs) should already have been acquired - // by the actor worker. - if (!worker->actor_id.is_nil()) { - RAY_CHECK(required_resources.size() == 1); - RAY_CHECK(required_resources.count("CPU") == 1); - } - - RAY_CHECK(worker->actor_id == TaskSpec_actor_id(spec)); - /* Make sure the driver for this task is still alive. */ - WorkerID driver_id = TaskSpec_driver_id(spec); - RAY_CHECK(is_driver_alive(state, driver_id)); - - /* Construct a flatbuffer object to send to the worker. */ - flatbuffers::FlatBufferBuilder fbb; - auto message = ray::local_scheduler::protocol::CreateGetTaskReply( - fbb, fbb.CreateString((char *) spec, task_spec_size), - fbb.CreateVector(worker->gpus_in_use)); - fbb.Finish(message); - - if (write_message(worker->sock, - static_cast(MessageType::ExecuteTask), - fbb.GetSize(), (uint8_t *) fbb.GetBufferPointer()) < 0) { - if (errno == EPIPE || errno == EBADF) { - /* Something went wrong, so kill the worker. */ - kill_worker(state, worker, false, false); - RAY_LOG(WARNING) << "Failed to give task to worker on fd " << worker->sock - << ". The client may have hung up."; - } else { - RAY_LOG(FATAL) << "Failed to give task to client on fd " << worker->sock; - } - } - - Task *task = - Task_alloc(execution_spec, TaskStatus::RUNNING, - state->db ? get_db_client_id(state->db) : DBClientID::nil()); - /* Record which task this worker is executing. This will be freed in - * process_message when the worker sends a GetTask message to the local - * scheduler. */ - worker->task_in_progress = Task_copy(task); - /* Update the global task table. */ - if (state->db != NULL) { - task_table_update(state->db, task, NULL, NULL, NULL); - } else { - Task_free(task); - } -} - -// This is used to allow task_table_update to fail. -void allow_task_table_update_failure(UniqueID id, - void *user_context, - void *user_data) {} - -void finish_task(LocalSchedulerState *state, LocalSchedulerClient *worker) { - if (worker->task_in_progress != NULL) { - TaskSpec *spec = Task_task_execution_spec(worker->task_in_progress)->Spec(); - // Return dynamic resources back for the task in progress. 
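When handing a task to a worker, the deleted code serializes a GetTaskReply flatbuffer and pushes it through write_message, treating EPIPE/EBADF as a worker that hung up (kill it and continue) and any other write failure as fatal. The sketch below shows the general pattern of a length-prefixed write with that error split; the header layout and the names WriteAll, WriteMessage, and WriteResult are illustrative assumptions, not Ray's actual wire format.

#include <cerrno>
#include <cstddef>
#include <cstdint>
#include <unistd.h>
#include <vector>

// Outcome of pushing a message to a worker socket: success, a client that has
// gone away (treat like a dead worker), or an unexpected failure.
enum class WriteResult { kOk, kClientGone, kFatal };

// Write the full buffer, retrying on EINTR.
static bool WriteAll(int fd, const uint8_t *data, size_t size) {
  size_t written = 0;
  while (written < size) {
    ssize_t n = write(fd, data + written, size - written);
    if (n < 0) {
      if (errno == EINTR) {
        continue;
      }
      return false;
    }
    written += static_cast<size_t>(n);
  }
  return true;
}

// Send a type tag and length header followed by the payload, mapping
// EPIPE/EBADF to kClientGone the way the deleted code kills the worker and
// carries on, and everything else to kFatal.
WriteResult WriteMessage(int fd, int64_t type,
                         const std::vector<uint8_t> &payload) {
  int64_t header[2] = {type, static_cast<int64_t>(payload.size())};
  if (!WriteAll(fd, reinterpret_cast<const uint8_t *>(header),
                sizeof(header)) ||
      !WriteAll(fd, payload.data(), payload.size())) {
    return (errno == EPIPE || errno == EBADF) ? WriteResult::kClientGone
                                              : WriteResult::kFatal;
  }
  return WriteResult::kOk;
}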
- if (TaskSpec_is_actor_creation_task(spec)) { - // Resources required by the actor creation task are acquired for the - // actor's lifetime, so don't return anything here. TODO(rkn): Should the - // actor creation task require 1 CPU in addition to any resources acquired - // for the lifetime of the actor? If not, then the local scheduler may - // schedule an arbitrary number of actor creation tasks concurrently (if - // they don't acquire any resources for their entire lifetime). In - // practice this will usually be rate-limited by the rate at which we can - // create new workers. - - ActorID actor_creation_id = TaskSpec_actor_creation_id(spec); - WorkerID driver_id = TaskSpec_driver_id(spec); - - // The driver must be alive because if the driver had been removed, then - // this worker would have been killed (because it was executing a task for - // the driver). - RAY_CHECK(is_driver_alive(state, driver_id)); - - // Update the worker struct with this actor ID. - RAY_CHECK(worker->actor_id.is_nil()); - worker->actor_id = actor_creation_id; - // Extract the initial execution dependency from the actor creation task. - RAY_CHECK(TaskSpec_num_returns(spec) == 1); - ObjectID initial_execution_dependency = TaskSpec_return(spec, 0); - // Let the scheduling algorithm process the presence of this new worker. - handle_convert_worker_to_actor(state, state->algorithm_state, - actor_creation_id, - initial_execution_dependency, worker); - // Publish the actor creation notification. The corresponding callback - // handle_actor_creation_callback will update state->actor_mapping. - publish_actor_creation_notification( - state->db, actor_creation_id, driver_id, get_db_client_id(state->db)); - } else if (worker->actor_id.is_nil()) { - // Return dynamic resources back for the task in progress. - RAY_CHECK(worker->resources_in_use["CPU"] == - TaskSpec_get_required_resource(spec, "CPU")); - // Return GPU resources. - RAY_CHECK(worker->gpus_in_use.size() == - TaskSpec_get_required_resource(spec, "GPU")); - release_resources(state, worker, worker->resources_in_use); - } else { - // Actor tasks should only specify CPU requirements. - RAY_CHECK(0 == TaskSpec_get_required_resource(spec, "GPU")); - std::unordered_map cpu_resources; - cpu_resources["CPU"] = TaskSpec_get_required_resource(spec, "CPU"); - release_resources(state, worker, cpu_resources); - } - /* If we're connected to Redis, update tables. */ - if (state->db != NULL) { - /* Update control state tables. */ - TaskStatus task_state = TaskStatus::DONE; - Task_set_state(worker->task_in_progress, task_state); - auto retryInfo = RetryInfo{ - .num_retries = 0, // This value is unused. - .timeout = 0, // This value is unused. - .fail_callback = allow_task_table_update_failure, - }; - - // We allow this call to fail in case the driver has been removed and the - // task table entries have already been cleaned up by the monitor. - task_table_update(state->db, worker->task_in_progress, &retryInfo, NULL, - NULL); - } else { - Task_free(worker->task_in_progress); - } - /* The call to task_table_update takes ownership of the - * task_in_progress, so we set the pointer to NULL so it is not used. */ - worker->task_in_progress = NULL; - } -} - -void process_plasma_notification(event_loop *loop, - int client_sock, - void *context, - int events) { - LocalSchedulerState *state = (LocalSchedulerState *) context; - /* Read the notification from Plasma. 
*/ - uint8_t *notification = read_message_async(loop, client_sock); - if (!notification) { - /* The store has closed the socket. */ - LocalSchedulerState_free(state); - RAY_LOG(FATAL) << "Lost connection to the plasma store, local scheduler is " - << "exiting!"; - } - auto object_info = flatbuffers::GetRoot(notification); - ObjectID object_id = from_flatbuf(*object_info->object_id()); - if (object_info->is_deletion()) { - handle_object_removed(state, object_id); - } else { - handle_object_available(state, state->algorithm_state, object_id); - } - free(notification); -} - -void reconstruct_task_update_callback(Task *task, - void *user_context, - bool updated) { - LocalSchedulerState *state = (LocalSchedulerState *) user_context; - if (!updated) { - /* The test-and-set failed. The task is either: (1) not finished yet, (2) - * lost, but not yet updated, or (3) already being reconstructed. */ - DBClientID current_local_scheduler_id = Task_local_scheduler(task); - if (!current_local_scheduler_id.is_nil()) { - DBClient current_local_scheduler = - db_client_table_cache_get(state->db, current_local_scheduler_id); - if (!current_local_scheduler.is_alive) { - /* (2) The current local scheduler for the task is dead. The task is - * lost, but the task table hasn't received the update yet. Retry the - * test-and-set. */ - task_table_test_and_update(state->db, Task_task_id(task), - current_local_scheduler_id, Task_state(task), - TaskStatus::RECONSTRUCTING, NULL, - reconstruct_task_update_callback, state); - } - } - /* The test-and-set failed, so it is not safe to resubmit the task for - * execution. Suppress the request. */ - return; - } - - /* Otherwise, the test-and-set succeeded, so resubmit the task for execution - * to ensure that reconstruction will happen. */ - TaskExecutionSpec *execution_spec = Task_task_execution_spec(task); - TaskSpec *spec = execution_spec->Spec(); - if (TaskSpec_actor_id(spec).is_nil()) { - handle_task_submitted(state, state->algorithm_state, *execution_spec); - } else { - handle_actor_task_submitted(state, state->algorithm_state, *execution_spec); - } - - /* Recursively reconstruct the task's inputs, if necessary. */ - int64_t num_dependencies = execution_spec->NumDependencies(); - for (int64_t i = 0; i < num_dependencies; ++i) { - int count = execution_spec->DependencyIdCount(i); - for (int64_t j = 0; j < count; ++j) { - ObjectID dependency_id = execution_spec->DependencyId(i, j); - reconstruct_object(state, dependency_id); - } - } -} - -void reconstruct_put_task_update_callback(Task *task, - void *user_context, - bool updated) { - LocalSchedulerState *state = (LocalSchedulerState *) user_context; - if (!updated) { - /* The test-and-set failed. The task is either: (1) not finished yet, (2) - * lost, but not yet updated, or (3) already being reconstructed. */ - DBClientID current_local_scheduler_id = Task_local_scheduler(task); - if (!current_local_scheduler_id.is_nil()) { - DBClient current_local_scheduler = - db_client_table_cache_get(state->db, current_local_scheduler_id); - if (!current_local_scheduler.is_alive) { - /* (2) The current local scheduler for the task is dead. The task is - * lost, but the task table hasn't received the update yet. Retry the - * test-and-set. */ - task_table_test_and_update(state->db, Task_task_id(task), - current_local_scheduler_id, Task_state(task), - TaskStatus::RECONSTRUCTING, NULL, - reconstruct_put_task_update_callback, state); - } else if (Task_state(task) == TaskStatus::RUNNING) { - /* (1) The task is still executing on a live node. 
The object created - * by `ray.put` was not able to be reconstructed, and the workload will - * likely hang. Push an error to the appropriate driver. */ - TaskSpec *spec = Task_task_execution_spec(task)->Spec(); - - std::ostringstream error_message; - error_message << "The task with ID " << TaskSpec_task_id(spec) - << " is still executing and so the object created by " - << "ray.put could not be reconstructed."; - push_error(state->db, TaskSpec_driver_id(spec), - ErrorIndex::PUT_RECONSTRUCTION, error_message.str()); - } - } else { - /* (1) The task is still executing and it is the driver task. We cannot - * restart the driver task, so the workload will hang. Push an error to - * the appropriate driver. */ - TaskSpec *spec = Task_task_execution_spec(task)->Spec(); - - std::ostringstream error_message; - error_message << "The task with ID " << TaskSpec_task_id(spec) - << " is a driver task and so the object created by ray.put " - << "could not be reconstructed."; - push_error(state->db, TaskSpec_driver_id(spec), - ErrorIndex::PUT_RECONSTRUCTION, error_message.str()); - } - } else { - /* The update to TaskStatus::RECONSTRUCTING succeeded, so continue with - * reconstruction as usual. */ - reconstruct_task_update_callback(task, user_context, updated); - } -} - -void reconstruct_evicted_result_lookup_callback(ObjectID reconstruct_object_id, - TaskID task_id, - bool is_put, - void *user_context) { - RAY_CHECK(!task_id.is_nil()) - << "No task information found for object during reconstruction"; - LocalSchedulerState *state = (LocalSchedulerState *) user_context; - - task_table_test_and_update_callback done_callback; - if (is_put) { - /* If the evicted object was created through ray.put and the originating - * task - * is still executing, it's very likely that the workload will hang and the - * worker needs to be restarted. Else, the reconstruction behavior is the - * same as for other evicted objects */ - done_callback = reconstruct_put_task_update_callback; - } else { - done_callback = reconstruct_task_update_callback; - } - /* If there are no other instances of the task running, it's safe for us to - * claim responsibility for reconstruction. */ - task_table_test_and_update(state->db, task_id, DBClientID::nil(), - (TaskStatus::DONE | TaskStatus::LOST), - TaskStatus::RECONSTRUCTING, NULL, done_callback, - state); -} - -void reconstruct_failed_result_lookup_callback(ObjectID reconstruct_object_id, - TaskID task_id, - bool is_put, - void *user_context) { - if (task_id.is_nil()) { - /* NOTE(swang): For some reason, the result table update sometimes happens - * after this lookup returns, possibly due to concurrent clients. In most - * cases, this is okay because the initial execution is probably still - * pending, so for now, we log a warning and suppress reconstruction. */ - RAY_LOG(WARNING) << "No task information found for object during " - << "reconstruction (no object entry yet)"; - return; - } - LocalSchedulerState *state = (LocalSchedulerState *) user_context; - /* If the task failed to finish, it's safe for us to claim responsibility for - * reconstruction. 
*/ - task_table_test_and_update(state->db, task_id, DBClientID::nil(), - TaskStatus::LOST, TaskStatus::RECONSTRUCTING, NULL, - reconstruct_task_update_callback, state); -} - -void reconstruct_object_lookup_callback( - ObjectID reconstruct_object_id, - bool never_created, - const std::vector &manager_ids, - void *user_context) { - RAY_LOG(DEBUG) << "Manager count was " << manager_ids.size(); - /* Only continue reconstruction if we find that the object doesn't exist on - * any nodes. NOTE: This codepath is not responsible for checking if the - * object table entry is up-to-date. */ - LocalSchedulerState *state = (LocalSchedulerState *) user_context; - /* Look up the task that created the object in the result table. */ - if (never_created) { - /* If the object has not been created yet, we reconstruct the object if and - * only if the task that created the object failed to complete. */ - result_table_lookup(state->db, reconstruct_object_id, NULL, - reconstruct_failed_result_lookup_callback, - (void *) state); - } else { - /* If the object has been created, filter out the dead plasma managers that - * have it. */ - size_t num_live_managers = 0; - for (auto manager_id : manager_ids) { - DBClient manager = db_client_table_cache_get(state->db, manager_id); - if (manager.is_alive) { - num_live_managers++; - } - } - /* If the object was created, but all plasma managers that had the object - * either evicted it or failed, we reconstruct the object if and only if - * there are no other instances of the task running. */ - if (num_live_managers == 0) { - result_table_lookup(state->db, reconstruct_object_id, NULL, - reconstruct_evicted_result_lookup_callback, - (void *) state); - } - } -} - -void reconstruct_object(LocalSchedulerState *state, - ObjectID reconstruct_object_id) { - RAY_LOG(DEBUG) << "Starting reconstruction"; - /* If the object is locally available, no need to reconstruct. */ - if (object_locally_available(state->algorithm_state, reconstruct_object_id)) { - return; - } - /* Determine if reconstruction is necessary by checking if the object exists - * on a node. */ - RAY_CHECK(state->db != NULL); - object_table_lookup(state->db, reconstruct_object_id, NULL, - reconstruct_object_lookup_callback, (void *) state); -} - -void handle_client_register( - LocalSchedulerState *state, - LocalSchedulerClient *worker, - const ray::local_scheduler::protocol::RegisterClientRequest *message) { - /* Make sure this worker hasn't already registered. */ - RAY_CHECK(!worker->registered); - worker->registered = true; - worker->is_worker = message->is_worker(); - RAY_CHECK(worker->client_id.is_nil()); - worker->client_id = from_flatbuf(*message->client_id()); - - /* Register the worker or driver. */ - if (worker->is_worker) { - /* Update the actor mapping with the actor ID of the worker (if an actor is - * running on the worker). */ - worker->pid = message->worker_pid(); - /* Register worker process id with the scheduler. */ - /* Determine if this worker is one of our child processes. */ - RAY_LOG(DEBUG) << "PID is " << worker->pid; - auto it = std::find(state->child_pids.begin(), state->child_pids.end(), - worker->pid); - if (it != state->child_pids.end()) { - /* If this worker is one of our child processes, mark it as a child so - * that we know that we can wait for the process to exit during - * cleanup. */ - worker->is_child = true; - state->child_pids.erase(it); - RAY_LOG(DEBUG) << "Found matching child pid " << worker->pid; - } - } else { - /* Register the driver. Currently we don't do anything here. 
*/ - } -} - -void handle_driver_removed_callback(WorkerID driver_id, void *user_context) { - LocalSchedulerState *state = (LocalSchedulerState *) user_context; - - /* Kill any actors that were created by the removed driver, and kill any - * workers that are currently running tasks from the dead driver. */ - auto it = state->workers.begin(); - while (it != state->workers.end()) { - /* Increment the iterator by one before calling kill_worker, because - * kill_worker will invalidate the iterator. Note that this requires - * knowledge of the particular container that we are iterating over (in this - * case it is a list). */ - auto next_it = it; - next_it++; - - ActorID actor_id = (*it)->actor_id; - Task *task = (*it)->task_in_progress; - - if (!actor_id.is_nil()) { - /* This is an actor. */ - RAY_CHECK(state->actor_mapping.count(actor_id) == 1); - if (state->actor_mapping[actor_id].driver_id == driver_id) { - /* This actor was created by the removed driver, so kill the actor. */ - RAY_LOG(DEBUG) << "Killing an actor for a removed driver."; - kill_worker(state, *it, false, true); - } - } else if (task != NULL) { - TaskSpec *spec = Task_task_execution_spec(task)->Spec(); - if (TaskSpec_driver_id(spec) == driver_id) { - RAY_LOG(DEBUG) << "Killing a worker executing a task for a removed " - << "driver."; - kill_worker(state, *it, false, true); - } - } - - it = next_it; - } - - /* Add the driver to a list of dead drivers. */ - state->removed_drivers.insert(driver_id); - - /* Notify the scheduling algorithm that the driver has been removed. It should - * remove tasks for that driver from its data structures. */ - handle_driver_removed(state, state->algorithm_state, driver_id); -} - -void handle_client_disconnect(LocalSchedulerState *state, - LocalSchedulerClient *worker) { - if (!worker->registered || worker->is_worker) { - } else { - /* In this case, a driver is disconecting. */ - driver_table_send_driver_death(state->db, worker->client_id, NULL); - } - /* Suppress the warning message if the worker already disconnected. */ - kill_worker(state, worker, false, worker->disconnected); -} - -void handle_get_actor_frontier(LocalSchedulerState *state, - LocalSchedulerClient *worker, - ActorID actor_id) { - auto task_counters = - get_actor_task_counters(state->algorithm_state, actor_id); - auto frontier = get_actor_frontier(state->algorithm_state, actor_id); - - /* Build the ActorFrontier flatbuffer. */ - std::vector handle_vector; - std::vector task_counter_vector; - std::vector frontier_vector; - for (auto handle : task_counters) { - handle_vector.push_back(handle.first); - task_counter_vector.push_back(handle.second); - frontier_vector.push_back(frontier[handle.first]); - } - flatbuffers::FlatBufferBuilder fbb; - auto reply = ray::local_scheduler::protocol::CreateActorFrontier( - fbb, to_flatbuf(fbb, actor_id), to_flatbuf(fbb, handle_vector), - fbb.CreateVector(task_counter_vector), to_flatbuf(fbb, frontier_vector)); - fbb.Finish(reply); - /* Respond with the built ActorFrontier. */ - if (write_message(worker->sock, - static_cast(MessageType::GetActorFrontierReply), - fbb.GetSize(), (uint8_t *) fbb.GetBufferPointer()) < 0) { - if (errno == EPIPE || errno == EBADF) { - /* Something went wrong, so kill the worker. */ - kill_worker(state, worker, false, false); - RAY_LOG(WARNING) << "Failed to return actor frontier to worker on fd " - << worker->sock << ". 
The client may have hung up."; - } else { - RAY_LOG(FATAL) << "Failed to give task to client on fd " << worker->sock; - } - } -} - -void handle_set_actor_frontier( - LocalSchedulerState *state, - LocalSchedulerClient *worker, - ray::local_scheduler::protocol::ActorFrontier const &frontier) { - /* Parse the ActorFrontier flatbuffer. */ - ActorID actor_id = from_flatbuf(*frontier.actor_id()); - std::unordered_map task_counters; - std::unordered_map frontier_dependencies; - for (size_t i = 0; i < frontier.handle_ids()->size(); ++i) { - ActorID handle_id = from_flatbuf(*frontier.handle_ids()->Get(i)); - task_counters[handle_id] = frontier.task_counters()->Get(i); - frontier_dependencies[handle_id] = - from_flatbuf(*frontier.frontier_dependencies()->Get(i)); - } - /* Set the actor's frontier. */ - set_actor_task_counters(state->algorithm_state, actor_id, task_counters); - set_actor_frontier(state, state->algorithm_state, actor_id, - frontier_dependencies); -} - -void process_message(event_loop *loop, - int client_sock, - void *context, - int events) { - int64_t start_time = current_time_ms(); - - LocalSchedulerClient *worker = (LocalSchedulerClient *) context; - LocalSchedulerState *state = worker->local_scheduler_state; - - int64_t type; - read_vector(client_sock, &type, state->input_buffer); - uint8_t *input = state->input_buffer.data(); - - RAY_LOG(DEBUG) << "New event of type " << type; - - switch (type) { - case static_cast(MessageType::SubmitTask): { - auto message = - flatbuffers::GetRoot( - input); - TaskExecutionSpec execution_spec = - TaskExecutionSpec(from_flatbuf(*message->execution_dependencies()), - (TaskSpec *) message->task_spec()->data(), - message->task_spec()->size()); - /* Set the tasks's local scheduler entrypoint time. */ - execution_spec.SetLastTimeStamp(current_time_ms()); - TaskSpec *spec = execution_spec.Spec(); - /* Update the result table, which holds mappings of object ID -> ID of the - * task that created it. */ - if (state->db != NULL) { - TaskID task_id = TaskSpec_task_id(spec); - for (int64_t i = 0; i < TaskSpec_num_returns(spec); ++i) { - ObjectID return_id = TaskSpec_return(spec, i); - result_table_add(state->db, return_id, task_id, false, NULL, NULL, - NULL); - } - } - - /* Handle the task submission. */ - if (TaskSpec_actor_id(spec).is_nil()) { - handle_task_submitted(state, state->algorithm_state, execution_spec); - } else { - handle_actor_task_submitted(state, state->algorithm_state, - execution_spec); - } - } break; - case static_cast(MessageType::TaskDone): { - } break; - case static_cast(MessageType::DisconnectClient): { - finish_task(state, worker); - RAY_CHECK(!worker->disconnected); - worker->disconnected = true; - /* If the disconnected worker was not an actor, start a new worker to make - * sure there are enough workers in the pool. */ - if (worker->actor_id.is_nil()) { - start_worker(state); - } - } break; - case static_cast(MessageType::EventLogMessage): { - /* Parse the message. 
*/ - auto message = - flatbuffers::GetRoot( - input); - if (state->db != NULL) { - RayLogger_log_event(state->db, (uint8_t *) message->key()->data(), - message->key()->size(), - (uint8_t *) message->value()->data(), - message->value()->size(), message->timestamp()); - } - } break; - case static_cast(MessageType::RegisterClientRequest): { - auto message = flatbuffers::GetRoot< - ray::local_scheduler::protocol::RegisterClientRequest>(input); - handle_client_register(state, worker, message); - } break; - case static_cast(MessageType::GetTask): { - /* If this worker reports a completed task, account for resources. */ - finish_task(state, worker); - /* Let the scheduling algorithm process the fact that there is an available - * worker. */ - if (worker->actor_id.is_nil()) { - handle_worker_available(state, state->algorithm_state, worker); - } else { - handle_actor_worker_available(state, state->algorithm_state, worker); - } - } break; - case static_cast(MessageType::ReconstructObjects): { - auto message = flatbuffers::GetRoot< - ray::local_scheduler::protocol::ReconstructObjects>(input); - RAY_CHECK(!message->fetch_only()); - if (worker->task_in_progress != NULL && !worker->is_blocked) { - /* If the worker was executing a task (i.e. non-driver) and it wasn't - * already blocked on an object that's not locally available, update its - * state to blocked. */ - worker->is_blocked = true; - // Return the CPU resources that the blocked worker was using, but not - // other resources. If the worker is an actor, this will not return the - // CPU resources that the worker has acquired for its lifetime. It will - // only return the ones associated with the current method. - TaskSpec *spec = - Task_task_execution_spec(worker->task_in_progress)->Spec(); - std::unordered_map cpu_resources; - cpu_resources["CPU"] = TaskSpec_get_required_resource(spec, "CPU"); - release_resources(state, worker, cpu_resources); - /* Let the scheduling algorithm process the fact that the worker is - * blocked. */ - if (worker->actor_id.is_nil()) { - handle_worker_blocked(state, state->algorithm_state, worker); - } else { - handle_actor_worker_blocked(state, state->algorithm_state, worker); - } - print_worker_info("Reconstructing", state->algorithm_state); - } - RAY_CHECK(message->object_ids()->size() == 1); - ObjectID object_id = from_flatbuf(*message->object_ids()->Get(0)); - reconstruct_object(state, object_id); - } break; - case static_cast(CommonMessageType::DISCONNECT_CLIENT): { - RAY_LOG(DEBUG) << "Disconnecting client on fd " << client_sock; - handle_client_disconnect(state, worker); - } break; - case static_cast(MessageType::NotifyUnblocked): { - /* TODO(rkn): A driver may call this as well, right? */ - if (worker->task_in_progress != NULL) { - /* If the worker was executing a task (i.e. non-driver), update its - * state to not blocked. */ - RAY_CHECK(worker->is_blocked); - worker->is_blocked = false; - /* Lease back the CPU resources that the blocked worker needs (note that - * it never released its GPU resources). TODO(swang): Leasing back the - * resources to blocked workers can cause us to transiently exceed the - * maximum number of resources. This could be fixed by having blocked - * workers explicitly yield and wait to be given back resources before - * continuing execution. 
*/ - TaskSpec *spec = - Task_task_execution_spec(worker->task_in_progress)->Spec(); - std::unordered_map cpu_resources; - cpu_resources["CPU"] = TaskSpec_get_required_resource(spec, "CPU"); - acquire_resources(state, worker, cpu_resources); - /* Let the scheduling algorithm process the fact that the worker is - * unblocked. */ - if (worker->actor_id.is_nil()) { - handle_worker_unblocked(state, state->algorithm_state, worker); - } else { - handle_actor_worker_unblocked(state, state->algorithm_state, worker); - } - } - print_worker_info("Worker unblocked", state->algorithm_state); - } break; - case static_cast(MessageType::PutObject): { - auto message = - flatbuffers::GetRoot(input); - result_table_add(state->db, from_flatbuf(*message->object_id()), - from_flatbuf(*message->task_id()), true, NULL, NULL, NULL); - } break; - case static_cast(MessageType::GetActorFrontierRequest): { - auto message = flatbuffers::GetRoot< - ray::local_scheduler::protocol::GetActorFrontierRequest>(input); - ActorID actor_id = from_flatbuf(*message->actor_id()); - handle_get_actor_frontier(state, worker, actor_id); - } break; - case static_cast(MessageType::SetActorFrontier): { - auto message = - flatbuffers::GetRoot( - input); - handle_set_actor_frontier(state, worker, *message); - } break; - default: - /* This code should be unreachable. */ - RAY_CHECK(0); - } - - /* Print a warning if this method took too long. */ - int64_t end_time = current_time_ms(); - if (end_time - start_time > - RayConfig::instance().max_time_for_handler_milliseconds()) { - RAY_LOG(WARNING) << "process_message of type " << type << " took " - << end_time - start_time << " milliseconds."; - } -} - -void new_client_connection(event_loop *loop, - int listener_sock, - void *context, - int events) { - LocalSchedulerState *state = (LocalSchedulerState *) context; - int new_socket = accept_client(listener_sock); - /* Create a struct for this worker. This will be freed when we free the local - * scheduler state. */ - LocalSchedulerClient *worker = new LocalSchedulerClient(); - worker->sock = new_socket; - worker->registered = false; - worker->disconnected = false; - /* We don't know whether this is a worker or not, so just initialize is_worker - * to false. */ - worker->is_worker = true; - worker->client_id = WorkerID::nil(); - worker->task_in_progress = NULL; - worker->is_blocked = false; - worker->pid = 0; - worker->is_child = false; - worker->actor_id = ActorID::nil(); - worker->local_scheduler_state = state; - state->workers.push_back(worker); - event_loop_add_file(loop, new_socket, EVENT_LOOP_READ, process_message, - worker); - RAY_LOG(DEBUG) << "new connection with fd " << new_socket; -} - -/* We need this code so we can clean up when we get a SIGTERM signal. */ - -LocalSchedulerState *g_state = NULL; - -void signal_handler(int signal) { - RAY_LOG(DEBUG) << "Signal was " << signal; - if (signal == SIGTERM) { - /* NOTE(swang): This call removes the SIGTERM handler to ensure that we - * free the local scheduler state at most once. If another SIGTERM is - * caught during this call, there is the possibility of orphan worker - * processes. */ - if (g_state) { - LocalSchedulerState_free(g_state); - } - exit(0); - } -} - -/* End of the cleanup code. 
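The ReconstructObjects and NotifyUnblocked cases above are two halves of the same bookkeeping: a worker that blocks on a missing object temporarily returns only the CPUs required by its current task (its GPU lease is never released), and it re-acquires those CPUs when it is unblocked, which, as the TODO notes, can transiently exceed the configured capacity. A small stand-alone sketch of that release/acquire pattern is below; ResourcePool and the hard-coded quantities are illustrative, not the real LocalSchedulerState accounting.

    #include <cassert>
    #include <string>
    #include <unordered_map>

    // Simplified stand-in for the scheduler's dynamic resource accounting.
    struct ResourcePool {
      std::unordered_map<std::string, double> available;

      void Release(const std::unordered_map<std::string, double> &resources) {
        for (const auto &kv : resources) available[kv.first] += kv.second;
      }
      void Acquire(const std::unordered_map<std::string, double> &resources) {
        for (const auto &kv : resources) available[kv.first] -= kv.second;
      }
    };

    int main() {
      ResourcePool pool;
      // 4 CPUs and 1 GPU total; a running task has already acquired 2 CPUs and the GPU.
      pool.available = {{"CPU", 2.0}, {"GPU", 0.0}};
      std::unordered_map<std::string, double> cpu_only = {{"CPU", 2.0}};

      // The worker blocks on a remote object: hand back only the CPUs, keep the GPU leased.
      pool.Release(cpu_only);
      assert(pool.available["CPU"] == 4.0 && pool.available["GPU"] == 0.0);

      // The worker unblocks: take the CPUs back before resuming. This can transiently
      // over-subscribe CPUs if they were re-leased to another task in the meantime.
      pool.Acquire(cpu_only);
      assert(pool.available["CPU"] == 2.0);
      return 0;
    }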
*/ - -void handle_task_scheduled_callback(Task *original_task, - void *subscribe_context) { - LocalSchedulerState *state = (LocalSchedulerState *) subscribe_context; - TaskExecutionSpec *execution_spec = Task_task_execution_spec(original_task); - TaskSpec *spec = execution_spec->Spec(); - - /* Set the tasks's local scheduler entrypoint time. */ - execution_spec->SetLastTimeStamp(current_time_ms()); - - /* If the driver for this task has been removed, then don't bother telling the - * scheduling algorithm. */ - WorkerID driver_id = TaskSpec_driver_id(spec); - if (!is_driver_alive(state, driver_id)) { - RAY_LOG(DEBUG) << "Ignoring scheduled task for removed driver."; - return; - } - - if (TaskSpec_actor_id(spec).is_nil()) { - /* This task does not involve an actor. Handle it normally. */ - handle_task_scheduled(state, state->algorithm_state, *execution_spec); - } else { - /* This task involves an actor. Call the scheduling algorithm's actor - * handler. */ - handle_actor_task_scheduled(state, state->algorithm_state, *execution_spec); - } -} - -/** - * Process a notification about the creation of a new actor. Use this to update - * the mapping from actor ID to the local scheduler ID of the local scheduler - * that is responsible for the actor. If this local scheduler is responsible for - * the actor, then launch a new worker process to create that actor. - * - * @param actor_id The ID of the actor being created. - * @param local_scheduler_id The ID of the local scheduler that is responsible - * for creating the actor. - * @param context The context for this callback. - * @return Void. - */ -void handle_actor_creation_callback(const ActorID &actor_id, - const WorkerID &driver_id, - const DBClientID &local_scheduler_id, - void *context) { - LocalSchedulerState *state = (LocalSchedulerState *) context; - - /* If the driver has been removed, don't bother doing anything. */ - if (state->removed_drivers.count(driver_id) == 1) { - return; - } - - // TODO(rkn): If we do not have perfect task suppression and it is possible - // for a task to be executed simultaneously on two nodes, then we will need to - // detect and handle that case. - - if (state->actor_mapping.count(actor_id) != 0) { - // This actor already exists. - auto it = state->actor_mapping.find(actor_id); - if (it->second.local_scheduler_id == get_db_client_id(state->db)) { - // TODO(rkn): The actor was previously assigned to this local scheduler. - // We should kill the actor here if it is still around. Also, if it hasn't - // registered yet, we should keep track of its PID so we can kill it - // anyway. - // TODO(swang): Evict actor dummy objects as part of actor cleanup. - } - } - - /* Create a new entry and add it to the actor mapping table. TODO(rkn): - * Currently this is never removed (except when the local scheduler state is - * deleted). */ - ActorMapEntry entry; - entry.local_scheduler_id = local_scheduler_id; - entry.driver_id = driver_id; - state->actor_mapping[actor_id] = entry; - - /* Let the scheduling algorithm process the fact that a new actor has been - * created. */ - handle_actor_creation_notification(state, state->algorithm_state, actor_id); -} - -int heartbeat_handler(event_loop *loop, timer_id id, void *context) { - LocalSchedulerState *state = (LocalSchedulerState *) context; - SchedulingAlgorithmState *algorithm_state = state->algorithm_state; - - // Spillback policy invocation is synchronized with the heartbeats. - spillback_tasks_handler(state); - - /* Check that the last heartbeat was not sent too long ago. 
*/ - int64_t current_time = current_time_ms(); - RAY_CHECK(current_time >= state->previous_heartbeat_time); - if (current_time - state->previous_heartbeat_time > - RayConfig::instance().num_heartbeats_timeout() * - RayConfig::instance().heartbeat_timeout_milliseconds()) { - RAY_LOG(FATAL) << "The last heartbeat was sent " - << current_time - state->previous_heartbeat_time - << " milliseconds ago."; - } - state->previous_heartbeat_time = current_time; - - LocalSchedulerInfo info; - /* Ask the scheduling algorithm to fill out the scheduler info struct. */ - provide_scheduler_info(state, algorithm_state, &info); - /* Publish the heartbeat to all subscribers of the local scheduler table. */ - local_scheduler_table_send_info(state->db, &info, NULL); - /* Reset the timer. */ - return RayConfig::instance().heartbeat_timeout_milliseconds(); -} - -void start_server( - const char *node_ip_address, - const char *socket_name, - const char *redis_primary_addr, - int redis_primary_port, - const char *plasma_store_socket_name, - const char *plasma_manager_socket_name, - const char *plasma_manager_address, - bool global_scheduler_exists, - const std::unordered_map &static_resource_conf, - const char *start_worker_command, - int num_workers) { - /* Ignore SIGPIPE signals. If we don't do this, then when we attempt to write - * to a client that has already died, the local scheduler could die. */ - signal(SIGPIPE, SIG_IGN); - /* Ignore SIGCHLD signals. If we don't do this, then worker processes will - * become zombies instead of dying gracefully. */ - signal(SIGCHLD, SIG_IGN); - int fd = bind_ipc_sock(socket_name, true); - event_loop *loop = event_loop_create(); - g_state = LocalSchedulerState_init( - node_ip_address, loop, redis_primary_addr, redis_primary_port, - socket_name, plasma_store_socket_name, plasma_manager_socket_name, - plasma_manager_address, global_scheduler_exists, static_resource_conf, - start_worker_command, num_workers); - /* Register a callback for registering new clients. */ - event_loop_add_file(loop, fd, EVENT_LOOP_READ, new_client_connection, - g_state); - /* Subscribe to receive notifications about tasks that are assigned to this - * local scheduler by the global scheduler or by other local schedulers. - * TODO(rkn): we also need to get any tasks that were assigned to this local - * scheduler before the call to subscribe. */ - if (g_state->db != NULL) { - task_table_subscribe(g_state->db, get_db_client_id(g_state->db), - TaskStatus::SCHEDULED, handle_task_scheduled_callback, - g_state, NULL, NULL, NULL); - } - /* Subscribe to notifications about newly created actors. */ - if (g_state->db != NULL) { - actor_notification_table_subscribe( - g_state->db, handle_actor_creation_callback, g_state, NULL); - } - /* Subscribe to notifications about removed drivers. */ - if (g_state->db != NULL) { - driver_table_subscribe(g_state->db, handle_driver_removed_callback, g_state, - NULL); - } - /* Create a timer for publishing information about the load on the local - * scheduler to the local scheduler table. This message also serves as a - * heartbeat. */ - if (g_state->db != NULL) { - event_loop_add_timer(loop, - RayConfig::instance().heartbeat_timeout_milliseconds(), - heartbeat_handler, g_state); - } - /* Listen for new and deleted db clients. */ - if (g_state->db != NULL) { - db_client_table_cache_init(g_state->db); - } - /* Create a timer for fetching queued tasks' missing object dependencies. 
*/ - event_loop_add_timer( - loop, RayConfig::instance().local_scheduler_fetch_timeout_milliseconds(), - fetch_object_timeout_handler, g_state); - /* Create a timer for initiating the reconstruction of tasks' missing object - * dependencies. */ - event_loop_add_timer( - loop, RayConfig::instance() - .local_scheduler_reconstruction_timeout_milliseconds(), - reconstruct_object_timeout_handler, g_state); - // Create a timer for rerunning actor creation tasks for actor tasks that are - // cached locally. - event_loop_add_timer( - loop, RayConfig::instance() - .local_scheduler_reconstruction_timeout_milliseconds(), - rerun_actor_creation_tasks_timeout_handler, g_state); - /* Run event loop. */ - event_loop_run(loop); -} - -/* Only declare the main function if we are not in testing mode, since the test - * suite has its own declaration of main. */ -#ifndef LOCAL_SCHEDULER_TEST -int main(int argc, char *argv[]) { - InitShutdownRAII ray_log_shutdown_raii( - ray::RayLog::StartRayLog, ray::RayLog::ShutDownRayLog, argv[0], RAY_INFO, - /*log_dir=*/""); - ray::RayLog::InstallFailureSignalHandler(); - signal(SIGTERM, signal_handler); - /* Path of the listening socket of the local scheduler. */ - char *scheduler_socket_name = NULL; - /* IP address and port of the primary redis instance. */ - char *redis_primary_addr_port = NULL; - /* Socket name for the local Plasma store. */ - char *plasma_store_socket_name = NULL; - /* Socket name for the local Plasma manager. */ - char *plasma_manager_socket_name = NULL; - /* Address for the plasma manager associated with this local scheduler - * instance. */ - char *plasma_manager_address = NULL; - /* The IP address of the node that this local scheduler is running on. */ - char *node_ip_address = NULL; - /* Comma-separated list of configured resource capabilities for this node. */ - char *static_resource_list = NULL; - std::unordered_map static_resource_conf; - /* The command to run when starting new workers. */ - char *start_worker_command = NULL; - /* The number of workers to start. */ - char *num_workers_str = NULL; - int c; - bool global_scheduler_exists = true; - while ((c = getopt(argc, argv, "s:r:p:m:ga:h:c:w:n:")) != -1) { - switch (c) { - case 's': - scheduler_socket_name = optarg; - break; - case 'r': - redis_primary_addr_port = optarg; - break; - case 'p': - plasma_store_socket_name = optarg; - break; - case 'm': - plasma_manager_socket_name = optarg; - break; - case 'g': - global_scheduler_exists = false; - break; - case 'a': - plasma_manager_address = optarg; - break; - case 'h': - node_ip_address = optarg; - break; - case 'c': - static_resource_list = optarg; - break; - case 'w': - start_worker_command = optarg; - break; - case 'n': - num_workers_str = optarg; - break; - default: - RAY_LOG(FATAL) << "unknown option " << c; - } - } - if (!static_resource_list) { - RAY_LOG(FATAL) << "please specify a static resource list with the -c " - << "switch"; - } - // Parse the resource list. - std::istringstream resource_string(static_resource_list); - std::string resource_name; - std::string resource_quantity; - - while (std::getline(resource_string, resource_name, ',')) { - RAY_CHECK(std::getline(resource_string, resource_quantity, ',')); - // TODO(rkn): The line below could throw an exception. What should we do - // about this? 
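The TODO just above points out that the std::stod call on the next line can throw (std::invalid_argument or std::out_of_range) when the -c resource list is malformed. One possible defensive variant of the same alternating name,quantity parsing is sketched below as a standalone helper, not a drop-in replacement; ParseResourceList and its error handling are illustrative only.

    #include <iostream>
    #include <sstream>
    #include <stdexcept>
    #include <string>
    #include <unordered_map>

    // Parse comma-separated name,quantity pairs (e.g. "CPU,8,GPU,2").
    // Returns false on an odd number of fields or a malformed quantity.
    bool ParseResourceList(const std::string &list,
                           std::unordered_map<std::string, double> *out) {
      std::istringstream stream(list);
      std::string name, quantity;
      while (std::getline(stream, name, ',')) {
        if (!std::getline(stream, quantity, ',')) {
          return false;  // Odd number of fields.
        }
        try {
          (*out)[name] = std::stod(quantity);
        } catch (const std::logic_error &) {
          return false;  // Covers both invalid_argument and out_of_range.
        }
      }
      return true;
    }

    int main() {
      std::unordered_map<std::string, double> conf;
      std::cout << ParseResourceList("CPU,8,GPU,2", &conf) << " "      // 1
                << ParseResourceList("CPU,lots", &conf) << std::endl;  // 0
      return 0;
    }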
- static_resource_conf[resource_name] = std::stod(resource_quantity); - } - - if (!scheduler_socket_name) { - RAY_LOG(FATAL) << "please specify socket for incoming connections with " - << "-s switch"; - } - if (!plasma_store_socket_name) { - RAY_LOG(FATAL) << "please specify socket for connecting to Plasma store " - << "with -p switch"; - } - if (!node_ip_address) { - RAY_LOG(FATAL) << "please specify the node IP address with -h switch"; - } - int num_workers = 0; - if (num_workers_str) { - num_workers = strtol(num_workers_str, NULL, 10); - if (num_workers < 0) { - RAY_LOG(FATAL) << "Number of workers must be nonnegative"; - } - } - - char redis_primary_addr[16]; - char *redis_addr = NULL; - int redis_port = -1; - if (!redis_primary_addr_port) { - /* Start the local scheduler without connecting to Redis. In this case, all - * submitted tasks will be queued and scheduled locally. */ - if (plasma_manager_socket_name) { - RAY_LOG(FATAL) << "if a plasma manager socket name is provided with the " - << "-m switch, then a redis address must be provided with " - << "the -r switch"; - } - } else { - int redis_primary_port; - /* Parse the primary Redis address into an IP address and a port. */ - if (parse_ip_addr_port(redis_primary_addr_port, redis_primary_addr, - &redis_primary_port) == -1) { - RAY_LOG(FATAL) << "if a redis address is provided with the -r switch, it " - << "should be formatted like 127.0.0.1:6379"; - } - if (!plasma_manager_socket_name) { - RAY_LOG(FATAL) << "please specify socket for connecting to Plasma " - << "manager with -m switch"; - } - redis_addr = redis_primary_addr; - redis_port = redis_primary_port; - } - - start_server(node_ip_address, scheduler_socket_name, redis_addr, redis_port, - plasma_store_socket_name, plasma_manager_socket_name, - plasma_manager_address, global_scheduler_exists, - static_resource_conf, start_worker_command, num_workers); -} -#endif diff --git a/src/local_scheduler/local_scheduler.h b/src/local_scheduler/local_scheduler.h deleted file mode 100644 index 39c7523fe7ed4..0000000000000 --- a/src/local_scheduler/local_scheduler.h +++ /dev/null @@ -1,176 +0,0 @@ -#ifndef LOCAL_SCHEDULER_H -#define LOCAL_SCHEDULER_H - -#include "event_loop.h" -#include "local_scheduler_shared.h" -#include "task.h" - -/** - * Establish a connection to a new client. - * - * @param loop Event loop of the local scheduler. - * @param listener_socket Socket the local scheduler is listening on for new - * client requests. - * @param context State of the local scheduler. - * @param events Flag for events that are available on the listener socket. - * @return Void. - */ -void new_client_connection(event_loop *loop, - int listener_sock, - void *context, - int events); - -/** - * Check if a driver is still alive. - * - * @param driver_id The ID of the driver. - * @return True if the driver is still alive and false otherwise. - */ -bool is_driver_alive(WorkerID driver_id); - -/** - * This function can be called by the scheduling algorithm to assign a task - * to a worker. - * - * @param info - * @param task The task that is submitted to the worker. - * @param worker The worker to assign the task to. - * @return Void. - */ -void assign_task_to_worker(LocalSchedulerState *state, - TaskExecutionSpec &task, - LocalSchedulerClient *worker); - -/* - * This function is called whenever a task has finished on one of the workers. - * It updates the resource accounting and the global state store. - * - * @param state The local scheduler state. 
- * @param worker The worker that finished the task. - * @return Void. - */ -void finish_task(LocalSchedulerState *state, LocalSchedulerClient *worker); - -/** - * This is the callback that is used to process a notification from the Plasma - * store that an object has been sealed. - * - * @param loop The local scheduler's event loop. - * @param client_sock The file descriptor to read the notification from. - * @param context The local scheduler state. - * @param events - * @return Void. - */ -void process_plasma_notification(event_loop *loop, - int client_sock, - void *context, - int events); - -/** - * Reconstruct an object. If the object does not exist on any nodes, according - * to the state tables, and if the object is not already being reconstructed, - * this triggers a single reexecution of the task that originally created the - * object. - * - * @param state The local scheduler state. - * @param object_id The ID of the object to reconstruct. - * @return Void. - */ -void reconstruct_object(LocalSchedulerState *state, ObjectID object_id); - -void print_resource_info(const LocalSchedulerState *s, const TaskSpec *spec); - -/** - * Kill a worker, if it is a child process, and clean up all of its associated - * state. Note that this function is also called on drivers, but it should not - * actually send a kill signal to drivers. - * - * @param state The local scheduler state. - * @param worker The local scheduler client to kill. - * @param wait A boolean representing whether to wait for the killed worker to - * exit. - * @param suppress_warning A bool that is true if we should not warn the driver, - * and false otherwise. This should only be true when a driver is - * removed. - * @return Void. - */ -void kill_worker(LocalSchedulerState *state, - LocalSchedulerClient *worker, - bool wait, - bool suppress_warning); - -/** - * Start a worker. This forks a new worker process that can be added to the - * pool of available workers, pending registration of its PID with the local - * scheduler. - * - * @param state The local scheduler state. - * @param Void. - */ -void start_worker(LocalSchedulerState *state); - -/** - * Check if a certain quantity of dynamic resources are available. If num_cpus - * is 0, we ignore the dynamic number of available CPUs (which may be negative). - * - * @param state The state of the local scheduler. - * @param resources The resources to check. - * @return True if there are enough CPUs and GPUs and false otherwise. - */ -bool check_dynamic_resources( - LocalSchedulerState *state, - const std::unordered_map &resources); - -/** - * Acquire additional resources (CPUs and GPUs) for a worker. - * - * @param state The local scheduler state. - * @param worker The worker who is acquiring resources. - * @param resources The resources to acquire. - * @return Void. - */ -void acquire_resources( - LocalSchedulerState *state, - LocalSchedulerClient *worker, - const std::unordered_map &resources); - -/** - * Return resources (CPUs and GPUs) being used by a worker to the local - * scheduler. - * - * @param state The local scheduler state. - * @param worker The worker who is returning resources. - * @param resources The resources to release. - * @return Void. - */ -void release_resources( - LocalSchedulerState *state, - LocalSchedulerClient *worker, - const std::unordered_map &resources); - -/** The following methods are for testing purposes only. 
*/ -#ifdef LOCAL_SCHEDULER_TEST -LocalSchedulerState *LocalSchedulerState_init( - const char *node_ip_address, - event_loop *loop, - const char *redis_addr, - int redis_port, - const char *local_scheduler_socket_name, - const char *plasma_manager_socket_name, - const char *plasma_store_socket_name, - const char *plasma_manager_address, - bool global_scheduler_exists, - const std::unordered_map &static_resource_vector, - const char *worker_path, - int num_workers); - -SchedulingAlgorithmState *get_algorithm_state(LocalSchedulerState *state); - -void process_message(event_loop *loop, - int client_sock, - void *context, - int events); - -#endif - -#endif /* LOCAL_SCHEDULER_H */ diff --git a/src/local_scheduler/local_scheduler_algorithm.cc b/src/local_scheduler/local_scheduler_algorithm.cc deleted file mode 100644 index 89d6c8d6df56c..0000000000000 --- a/src/local_scheduler/local_scheduler_algorithm.cc +++ /dev/null @@ -1,1851 +0,0 @@ -#include "local_scheduler_algorithm.h" - -#include -#include -#include - -#include "state/task_table.h" -#include "state/actor_notification_table.h" -#include "state/db_client_table.h" -#include "state/error_table.h" -#include "state/local_scheduler_table.h" -#include "state/object_table.h" -#include "local_scheduler_shared.h" -#include "local_scheduler.h" -#include "common/task.h" - -/* Declared for convenience. */ -void remove_actor(SchedulingAlgorithmState *algorithm_state, ActorID actor_id); - -void give_task_to_global_scheduler(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec); - -void give_task_to_local_scheduler(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec, - DBClientID local_scheduler_id); - -void clear_missing_dependencies(SchedulingAlgorithmState *algorithm_state, - std::list::iterator it); - -/** A data structure used to track which objects are available locally and - * which objects are being actively fetched. Objects of this type are used for - * both the scheduling algorithm state's local_objects and remote_objects - * tables. An ObjectEntry should be in at most one of the tables and not both - * simultaneously. */ -struct ObjectEntry { - /** A vector of tasks dependent on this object. These tasks are a subset of - * the tasks in the waiting queue. Each element actually stores a reference - * to the corresponding task's queue entry in waiting queue, for fast - * deletion when all of the task's dependencies become available. */ - std::vector::iterator> dependent_tasks; - /** Whether or not to request a transfer of this object. This should be set - * to true for all objects except for actor dummy objects, where the object - * must be generated by executing the task locally. */ - bool request_transfer; -}; - -/** This struct contains information about a specific actor. This struct will be - * used inside of a hash table. */ -typedef struct { - /** The number of tasks that have been executed on this actor so far, per - * handle. This is used to guarantee execution of tasks on actors in the - * order that the tasks were submitted, per handle. Tasks from different - * handles to the same actor may be interleaved. */ - std::unordered_map task_counters; - /** These are the execution dependencies that make up the frontier of the - * actor's runnable tasks. For each actor handle, we store the object ID - * that represents the execution dependency for the next runnable task - * submitted by that handle. 
*/ - std::unordered_map frontier_dependencies; - /** The return value of the most recently executed task. The next task to - * execute should take this as an execution dependency at dispatch time. Set - * to nil if there are no execution dependencies (e.g., this is the first - * task to execute). */ - ObjectID execution_dependency; - /** A queue of tasks to be executed on this actor. The tasks will be sorted by - * the order of their actor counters. */ - std::list *task_queue; - /** The worker that the actor is running on. */ - LocalSchedulerClient *worker; - /** True if the worker is available and false otherwise. */ - bool worker_available; -} LocalActorInfo; - -/** Part of the local scheduler state that is maintained by the scheduling - * algorithm. */ -struct SchedulingAlgorithmState { - /** An array of pointers to tasks that are waiting for dependencies. */ - std::list *waiting_task_queue; - /** An array of pointers to tasks whose dependencies are ready but that are - * waiting to be assigned to a worker. */ - std::list *dispatch_task_queue; - /** This is a hash table from actor ID to information about that actor. In - * particular, a queue of tasks that are waiting to execute on that actor. - * This is only used for actors that exist locally. */ - std::unordered_map local_actor_infos; - /** This is a set of the IDs of the actors that have tasks waiting to run. - * The purpose is to make it easier to dispatch tasks without looping over - * all of the actors. Note that this is an optimization and is not strictly - * necessary. */ - std::unordered_set actors_with_pending_tasks; - /** A vector of actor tasks that have been submitted but this local scheduler - * doesn't know which local scheduler is responsible for them, so cannot - * assign them to the correct local scheduler yet. Whenever a notification - * about a new local scheduler arrives, we will resubmit all of these tasks - * locally. */ - std::vector cached_submitted_actor_tasks; - /** An array of pointers to workers in the worker pool. These are workers - * that have registered a PID with us and that are now waiting to be - * assigned a task to execute. */ - std::vector available_workers; - /** An array of pointers to workers that are currently executing a task, - * unblocked. These are the workers that are leasing some number of - * resources. */ - std::vector executing_workers; - /** An array of pointers to workers that are currently executing a task, - * blocked on some object(s) that isn't available locally yet. These are the - * workers that are executing a task, but that have temporarily returned the - * task's required resources. */ - std::vector blocked_workers; - /** A hash map of the objects that are available in the local Plasma store. - * The key is the object ID. This information could be a little stale. */ - std::unordered_map local_objects; - /** A hash map of the objects that are not available locally. These are - * currently being fetched by this local scheduler. The key is the object - * ID. Every local_scheduler_fetch_timeout_milliseconds, a Plasma fetch - * request will be sent the object IDs in this table. Each entry also holds - * an array of queued tasks that are dependent on it. */ - std::unordered_map remote_objects; -}; - -SchedulingAlgorithmState *SchedulingAlgorithmState_init(void) { - SchedulingAlgorithmState *algorithm_state = new SchedulingAlgorithmState(); - /* Initialize the local data structures used for queuing tasks and workers. 
*/ - algorithm_state->waiting_task_queue = new std::list(); - algorithm_state->dispatch_task_queue = new std::list(); - - return algorithm_state; -} - -void SchedulingAlgorithmState_free(SchedulingAlgorithmState *algorithm_state) { - /* Free all of the tasks in the waiting queue. */ - delete algorithm_state->waiting_task_queue; - /* Free all the tasks in the dispatch queue. */ - delete algorithm_state->dispatch_task_queue; - /* Remove all of the remaining actors. */ - while (algorithm_state->local_actor_infos.size() != 0) { - auto it = algorithm_state->local_actor_infos.begin(); - ActorID actor_id = it->first; - remove_actor(algorithm_state, actor_id); - } - /* Free the algorithm state. */ - delete algorithm_state; -} - -/** - * This is a helper method to check if a worker is in a vector of workers. - * - * @param worker_vector A vector of workers. - * @param The worker to look for in the vector. - * @return True if the worker is in the vector and false otherwise. - */ -bool worker_in_vector(std::vector &worker_vector, - LocalSchedulerClient *worker) { - auto it = std::find(worker_vector.begin(), worker_vector.end(), worker); - return it != worker_vector.end(); -} - -/** - * This is a helper method to remove a worker from a vector of workers if it is - * present in the vector. - * - * @param worker_vector A vector of workers. - * @param The worker to remove. - * @return True if the worker was removed and false otherwise. - */ -bool remove_worker_from_vector( - std::vector &worker_vector, - LocalSchedulerClient *worker) { - /* Find the worker in the list of executing workers. */ - auto it = std::find(worker_vector.begin(), worker_vector.end(), worker); - bool remove_worker = (it != worker_vector.end()); - if (remove_worker) { - /* Remove the worker from the list of workers. */ - using std::swap; - swap(*it, worker_vector.back()); - worker_vector.pop_back(); - } - return remove_worker; -} - -void provide_scheduler_info(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerInfo *info) { - info->total_num_workers = state->workers.size(); - /* TODO(swang): Provide separate counts for tasks that are waiting for - * dependencies vs tasks that are waiting to be assigned. */ - int64_t waiting_task_queue_length = - algorithm_state->waiting_task_queue->size(); - int64_t dispatch_task_queue_length = - algorithm_state->dispatch_task_queue->size(); - info->task_queue_length = - waiting_task_queue_length + dispatch_task_queue_length; - info->available_workers = algorithm_state->available_workers.size(); - /* Copy static and dynamic resource information. */ - info->dynamic_resources = state->dynamic_resources; - info->static_resources = state->static_resources; -} - -/** - * Create the LocalActorInfo struct for an actor worker that this local - * scheduler is responsible for. For a given actor, this will either be done - * when the first task for that actor arrives or when the worker running that - * actor connects to the local scheduler. - * - * @param algorithm_state The state of the scheduling algorithm. - * @param actor_id The actor ID of the actor being created. - * @param initial_execution_dependency The dummy object ID of the actor - * creation task. - * @param worker The worker struct for the worker that is running this actor. 
- * If the worker struct has not been created yet (meaning that the worker - * that is running this actor has not registered with the local scheduler - * yet, and so create_actor is being called because a task for that actor - * has arrived), then this should be NULL. - * @return Void. - */ -void create_actor(SchedulingAlgorithmState *algorithm_state, - const ActorID &actor_id, - const ObjectID &initial_execution_dependency, - LocalSchedulerClient *worker) { - LocalActorInfo entry; - entry.task_counters[ActorHandleID::nil()] = 0; - entry.frontier_dependencies[ActorHandleID::nil()] = ObjectID::nil(); - /* The actor has not yet executed any tasks, so there are no execution - * dependencies for the next task to be scheduled. */ - entry.execution_dependency = initial_execution_dependency; - entry.task_queue = new std::list(); - entry.worker = worker; - entry.worker_available = false; - RAY_CHECK(algorithm_state->local_actor_infos.count(actor_id) == 0); - algorithm_state->local_actor_infos[actor_id] = entry; - - /* Log some useful information about the actor that we created. */ - RAY_LOG(DEBUG) << "Creating actor with ID " << actor_id; -} - -void remove_actor(SchedulingAlgorithmState *algorithm_state, ActorID actor_id) { - RAY_CHECK(algorithm_state->local_actor_infos.count(actor_id) == 1); - LocalActorInfo &entry = - algorithm_state->local_actor_infos.find(actor_id)->second; - - /* Log some useful information about the actor that we're removing. */ - size_t count = entry.task_queue->size(); - if (count > 0) { - RAY_LOG(WARNING) << "Removing actor with ID " << actor_id << " and " - << count << " remaining tasks."; - } - - entry.task_queue->clear(); - delete entry.task_queue; - /* Remove the entry from the hash table. */ - algorithm_state->local_actor_infos.erase(actor_id); - - /* Remove the actor ID from the set of actors with pending tasks. */ - algorithm_state->actors_with_pending_tasks.erase(actor_id); -} - -/** - * Dispatch a task to an actor if possible. - * - * @param state The state of the local scheduler. - * @param algorithm_state The state of the scheduling algorithm. - * @param actor_id The ID of the actor corresponding to the worker. - * @return True if a task was dispatched to the actor and false otherwise. - */ -bool dispatch_actor_task(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id) { - /* Make sure this worker actually is an actor. */ - RAY_CHECK(!actor_id.is_nil()); - /* Return if this actor doesn't have any pending tasks. */ - if (algorithm_state->actors_with_pending_tasks.find(actor_id) == - algorithm_state->actors_with_pending_tasks.end()) { - return false; - } - /* Make sure this actor belongs to this local scheduler. */ - if (state->actor_mapping.count(actor_id) != 1) { - /* The creation notification for this actor has not yet arrived at the local - * scheduler. This should be rare. */ - return false; - } - RAY_CHECK(state->actor_mapping[actor_id].local_scheduler_id == - get_db_client_id(state->db)); - - /* Get the local actor entry for this actor. */ - RAY_CHECK(algorithm_state->local_actor_infos.count(actor_id) != 0); - LocalActorInfo &entry = - algorithm_state->local_actor_infos.find(actor_id)->second; - - /* There should be some queued tasks for this actor. */ - RAY_CHECK(!entry.task_queue->empty()); - /* If the worker is not available, we cannot assign a task to it. */ - if (!entry.worker_available) { - return false; - } - - /* Check whether we can execute the first task in the queue. 
*/ - auto task = entry.task_queue->begin(); - TaskSpec *spec = task->Spec(); - ActorHandleID next_task_handle_id = TaskSpec_actor_handle_id(spec); - /* We can only execute tasks in order of task_counter. */ - if (TaskSpec_actor_counter(spec) != - entry.task_counters[next_task_handle_id]) { - return false; - } - - /* If there are not enough resources available, we cannot assign the task. */ - RAY_CHECK(0 == TaskSpec_get_required_resource(spec, "GPU")); - if (!check_dynamic_resources(state, TaskSpec_get_required_resources(spec))) { - return false; - } - - /* Update the task's execution dependencies to reflect the actual execution - * order to support deterministic reconstruction. */ - /* NOTE(swang): The update of an actor task's execution dependencies is - * performed asynchronously. This means that if this local scheduler dies, we - * may lose updates that are in flight to the task table. We only guarantee - * deterministic reconstruction ordering for tasks whose updates are - * reflected in the task table. */ - std::vector ordered_execution_dependencies; - ordered_execution_dependencies.push_back(entry.execution_dependency); - task->SetExecutionDependencies(ordered_execution_dependencies); - - /* Assign the first task in the task queue to the worker and mark the worker - * as unavailable. */ - assign_task_to_worker(state, *task, entry.worker); - entry.execution_dependency = TaskSpec_actor_dummy_object(spec); - entry.worker_available = false; - /* Extend the frontier to include the assigned task. */ - entry.task_counters[next_task_handle_id] += 1; - entry.frontier_dependencies[next_task_handle_id] = entry.execution_dependency; - - /* Remove the task from the actor's task queue. */ - entry.task_queue->erase(task); - /* If there are no more tasks in the queue, then indicate that the actor has - * no tasks. */ - if (entry.task_queue->empty()) { - algorithm_state->actors_with_pending_tasks.erase(actor_id); - } - - return true; -} - -void handle_convert_worker_to_actor( - LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - const ActorID &actor_id, - const ObjectID &initial_execution_dependency, - LocalSchedulerClient *worker) { - if (algorithm_state->local_actor_infos.count(actor_id) == 0) { - create_actor(algorithm_state, actor_id, initial_execution_dependency, - worker); - } else { - /* In this case, the LocalActorInfo struct was already been created by the - * first call to add_task_to_actor_queue. However, the worker field was not - * filled out, so fill out the correct worker field now. */ - algorithm_state->local_actor_infos[actor_id].worker = worker; - } - /* Increment the task counter for the creator's handle to account for the - * actor creation task. */ - auto &task_counters = - algorithm_state->local_actor_infos[actor_id].task_counters; - RAY_CHECK(task_counters[ActorHandleID::nil()] == 0); - task_counters[ActorHandleID::nil()]++; -} - -/** - * Finishes a killed task by inserting dummy objects for each of its returns. - */ -void finish_killed_task(LocalSchedulerState *state, - TaskExecutionSpec &execution_spec) { - TaskSpec *spec = execution_spec.Spec(); - int64_t num_returns = TaskSpec_num_returns(spec); - for (int i = 0; i < num_returns; i++) { - ObjectID object_id = TaskSpec_return(spec, i); - std::shared_ptr data; - // TODO(ekl): this writes an invalid arrow object, which is sufficient to - // signal that the worker failed, but it would be nice to return more - // detailed failure metadata in the future. 
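The counter check in dispatch_actor_task above is what enforces per-handle FIFO execution on an actor: a queued task is dispatched only when its counter equals the number of tasks already executed for the handle that submitted it, and that counter (the handle's frontier) is advanced as the task is assigned. A reduced sketch of the ordering rule follows, with plain ints standing in for ActorHandleID and a trivial queue in place of the real sorted task queue.

    #include <cstdint>
    #include <iostream>
    #include <list>
    #include <unordered_map>

    // Simplified actor task: which handle submitted it and its per-handle counter.
    struct ActorTask {
      int handle_id;
      int64_t counter;
    };

    struct ActorQueue {
      std::list<ActorTask> task_queue;                 // Pending tasks for this actor.
      std::unordered_map<int, int64_t> task_counters;  // Tasks already dispatched, per handle.
    };

    // Dispatch the head of the queue only if it is the next expected task for its handle.
    bool DispatchNext(ActorQueue *actor) {
      if (actor->task_queue.empty()) return false;
      const ActorTask &head = actor->task_queue.front();
      if (head.counter != actor->task_counters[head.handle_id]) {
        return false;  // A predecessor from the same handle has not run yet.
      }
      actor->task_counters[head.handle_id] += 1;  // Extend the handle's frontier.
      actor->task_queue.pop_front();
      return true;
    }

    int main() {
      ActorQueue actor;
      // The task with counter 1 from handle 0 is queued, but task 0 has not arrived yet.
      actor.task_queue.push_back({0, 1});
      std::cout << DispatchNext(&actor) << "\n";  // 0: handle 0 still owes task 0.
      actor.task_queue.push_front({0, 0});        // The missing predecessor arrives.
      std::cout << DispatchNext(&actor) << "\n";  // 1: counter 0 runs first...
      std::cout << DispatchNext(&actor) << "\n";  // 1: ...then counter 1.
      return 0;
    }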
- arrow::Status status = - state->plasma_conn->Create(object_id.to_plasma_id(), 1, NULL, 0, &data); - if (!status.IsPlasmaObjectExists()) { - ARROW_CHECK_OK(status); - ARROW_CHECK_OK(state->plasma_conn->Seal(object_id.to_plasma_id())); - } - } - /* Mark the task as done. */ - if (state->db != NULL) { - Task *task = Task_alloc(execution_spec, TaskStatus::DONE, - get_db_client_id(state->db)); - // In most cases, task_table_update would be appropriate, however, it is - // possible in some cases that the task has not yet been added to the task - // table (e.g., if it is an actor task that is queued locally because the - // actor has not been created yet). - task_table_add_task(state->db, task, NULL, NULL, NULL); - } -} - -/** - * Insert a task queue entry into an actor's dispatch queue. The task is - * inserted in sorted order by task counter. If this is the first task - * scheduled to this actor and the worker process has not yet connected, then - * this also creates a LocalActorInfo entry for the actor. - * - * @param state The state of the local scheduler. - * @param algorithm_state The state of the scheduling algorithm. - * @param task_entry The task queue entry to add to the actor's queue. - * @return Void. - */ -void insert_actor_task_queue(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec task_entry) { - TaskSpec *spec = task_entry.Spec(); - /* Get the local actor entry for this actor. */ - ActorID actor_id = TaskSpec_actor_id(spec); - ActorHandleID task_handle_id = TaskSpec_actor_handle_id(spec); - int64_t task_counter = TaskSpec_actor_counter(spec); - - /* Fail the task immediately; it's destined for a dead actor. */ - if (state->removed_actors.find(actor_id) != state->removed_actors.end()) { - finish_killed_task(state, task_entry); - return; - } - - LocalActorInfo &entry = - algorithm_state->local_actor_infos.find(actor_id)->second; - if (entry.task_counters.count(task_handle_id) == 0) { - entry.task_counters[task_handle_id] = 0; - } - /* Extend the frontier to include the new handle. */ - if (entry.frontier_dependencies.count(task_handle_id) == 0) { - RAY_CHECK(task_entry.ExecutionDependencies().size() == 1); - entry.frontier_dependencies[task_handle_id] = - task_entry.ExecutionDependencies()[0]; - } - - /* As a sanity check, the counter of the new task should be greater than the - * number of tasks that have executed on this actor so far (since we are - * guaranteeing in-order execution of the tasks on the actor). TODO(rkn): This - * check will fail if the fault-tolerance mechanism resubmits a task on an - * actor. */ - if (task_counter < entry.task_counters[task_handle_id]) { - RAY_LOG(INFO) << "A task that has already been executed has been " - << "resubmitted, so we are ignoring it. This should only " - << "happen during reconstruction."; - return; - } - - /* Insert the task spec to the actor's task queue in sorted order, per actor - * handle ID. Find the first task in the queue with a counter greater than - * the submitted task's and the same handle ID. */ - auto it = entry.task_queue->begin(); - for (; it != entry.task_queue->end(); it++) { - TaskSpec *pending_task_spec = it->Spec(); - /* Skip tasks submitted by a different handle. */ - if (!(task_handle_id == TaskSpec_actor_handle_id(pending_task_spec))) { - continue; - } - /* A duplicate task submitted by the same handle. */ - if (task_counter == TaskSpec_actor_counter(pending_task_spec)) { - RAY_LOG(INFO) << "A task was resubmitted, so we are ignoring it. 
This " - << "should only happen during reconstruction."; - return; - } - /* We found a task with the same handle ID and a greater task counter. */ - if (task_counter < TaskSpec_actor_counter(pending_task_spec)) { - break; - } - } - entry.task_queue->insert(it, std::move(task_entry)); - - /* Record the fact that this actor has a task waiting to execute. */ - algorithm_state->actors_with_pending_tasks.insert(actor_id); -} - -/** - * Queue a task to be dispatched for an actor. Update the task table for the - * queued task. TODO(rkn): Should we also update the task table in the case - * where the tasks are cached locally? - * - * @param state The state of the local scheduler. - * @param algorithm_state The state of the scheduling algorithm. - * @param spec The task spec to add. - * @param from_global_scheduler True if the task was assigned to this local - * scheduler by the global scheduler and false if it was submitted - * locally by a worker. - * @return Void. - */ -void queue_actor_task(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec, - bool from_global_scheduler) { - TaskSpec *spec = execution_spec.Spec(); - ActorID actor_id = TaskSpec_actor_id(spec); - RAY_CHECK(!actor_id.is_nil()); - - /* Update the task table. */ - if (state->db != NULL) { - Task *task = Task_alloc(execution_spec, TaskStatus::QUEUED, - get_db_client_id(state->db)); - if (from_global_scheduler) { - /* If the task is from the global scheduler, it's already been added to - * the task table, so just update the entry. */ - task_table_update(state->db, task, NULL, NULL, NULL); - } else { - /* Otherwise, this is the first time the task has been seen in the - * system (unless it's a resubmission of a previous task), so add the - * entry. */ - task_table_add_task(state->db, task, NULL, NULL, NULL); - } - } - - // Create a new task queue entry. This must come after the above block because - // insert_actor_task_queue may call task_table_update internally, which must - // come after the prior call to task_table_add_task. - TaskExecutionSpec copy = TaskExecutionSpec(&execution_spec); - insert_actor_task_queue(state, algorithm_state, std::move(copy)); -} - -/** - * Fetch a queued task's missing object dependency. The fetch request will be - * retried every local_scheduler_fetch_timeout_milliseconds until the object is - * available locally. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @param task_entry_it A reference to the task entry in the waiting queue. - * @param obj_id The ID of the object that the task is dependent on. - * @param request_transfer Whether to request a transfer of this object from - * other plasma managers. This should be set to false for execution - * dependencies, which should be fulfilled by executing the - * corresponding task locally. - * @returns Void. - */ -void fetch_missing_dependency( - LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - std::list::iterator task_entry_it, - plasma::ObjectID obj_id, - bool request_transfer) { - if (algorithm_state->remote_objects.count(obj_id) == 0) { - /* We weren't actively fetching this object. Try the fetch once - * immediately. */ - if (state->plasma_conn->get_manager_fd() != -1) { - auto arrow_status = state->plasma_conn->Fetch(1, &obj_id); - if (!arrow_status.ok()) { - LocalSchedulerState_free(state); - /* TODO(swang): Local scheduler should also exit even if there are no - * pending fetches. 
This could be done by subscribing to the db_client - * table, or pinging the plasma manager in the heartbeat handler. */ - RAY_LOG(FATAL) << "Lost connection to the plasma manager, local " - << "scheduler is exiting. Error: " - << arrow_status.ToString(); - } - } - /* Create an entry and add it to the list of active fetch requests to - * ensure that the fetch actually happens. The entry will be moved to the - * hash table of locally available objects in handle_object_available when - * the object becomes available locally. It will get freed if the object is - * subsequently removed locally. */ - ObjectEntry entry; - entry.request_transfer = request_transfer; - algorithm_state->remote_objects[obj_id] = entry; - } - algorithm_state->remote_objects[obj_id].dependent_tasks.push_back( - task_entry_it); -} - -/** - * Fetch a queued task's missing object dependencies. The fetch requests will - * be retried every local_scheduler_fetch_timeout_milliseconds until all - * objects are available locally. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @param task_entry_it A reference to the task entry in the waiting queue. - * @returns Void. - */ -void fetch_missing_dependencies( - LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - std::list::iterator task_entry_it) { - int64_t num_dependencies = task_entry_it->NumDependencies(); - int num_missing_dependencies = 0; - for (int64_t i = 0; i < num_dependencies; ++i) { - int count = task_entry_it->DependencyIdCount(i); - for (int j = 0; j < count; ++j) { - ObjectID obj_id = task_entry_it->DependencyId(i, j); - /* If the entry is not yet available locally, record the dependency. */ - if (algorithm_state->local_objects.count(obj_id) == 0) { - /* Do not request a transfer from other plasma managers if this is an - * execution dependency. */ - bool request_transfer = task_entry_it->IsStaticDependency(i); - fetch_missing_dependency(state, algorithm_state, task_entry_it, - obj_id.to_plasma_id(), request_transfer); - ++num_missing_dependencies; - } - } - } - RAY_CHECK(num_missing_dependencies > 0); -} - -/** - * Clear a queued task's missing object dependencies. This is the inverse of - * fetch_missing_dependencies. - * TODO(swang): Test this function. - * - * @param algorithm_state The scheduling algorithm state. - * @param task_entry_it A reference to the task entry in the waiting queue. - * @returns Void. - */ -void clear_missing_dependencies( - SchedulingAlgorithmState *algorithm_state, - std::list::iterator task_entry_it) { - int64_t num_dependencies = task_entry_it->NumDependencies(); - for (int64_t i = 0; i < num_dependencies; ++i) { - int count = task_entry_it->DependencyIdCount(i); - for (int j = 0; j < count; ++j) { - ObjectID obj_id = task_entry_it->DependencyId(i, j); - /* If this object dependency is missing, remove this task from the - * object's list of dependent tasks. */ - auto entry = algorithm_state->remote_objects.find(obj_id); - if (entry != algorithm_state->remote_objects.end()) { - /* Find and remove the given task. */ - auto &dependent_tasks = entry->second.dependent_tasks; - for (auto dependent_task_it = dependent_tasks.begin(); - dependent_task_it != dependent_tasks.end();) { - if (*dependent_task_it == task_entry_it) { - dependent_task_it = dependent_tasks.erase(dependent_task_it); - } else { - dependent_task_it++; - } - } - /* If the missing object dependency has no more dependent tasks, then - * remove it. 
*/ - if (dependent_tasks.empty()) { - algorithm_state->remote_objects.erase(entry); - } - } - } - } -} - -/** - * Check if all of the remote object arguments for a task are available in the - * local object store. - * - * @param algorithm_state The scheduling algorithm state. - * @param task Task specification of the task to check. - * @return bool This returns true if all of the remote object arguments for the - * task are present in the local object store, otherwise it returns - * false. - */ -bool can_run(SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &task) { - int64_t num_dependencies = task.NumDependencies(); - for (int i = 0; i < num_dependencies; ++i) { - int count = task.DependencyIdCount(i); - for (int j = 0; j < count; ++j) { - ObjectID obj_id = task.DependencyId(i, j); - if (algorithm_state->local_objects.count(obj_id) == 0) { - /* The object is not present locally, so this task cannot be scheduled - * right now. */ - return false; - } - } - } - return true; -} - -bool object_locally_available(SchedulingAlgorithmState *algorithm_state, - ObjectID object_id) { - return algorithm_state->local_objects.count(object_id) == 1; -} - -/* TODO(swang): This method is not covered by any valgrind tests. */ -int fetch_object_timeout_handler(event_loop *loop, timer_id id, void *context) { - int64_t start_time = current_time_ms(); - - LocalSchedulerState *state = (LocalSchedulerState *) context; - /* Only try the fetches if we are connected to the object store manager. */ - if (state->plasma_conn->get_manager_fd() == -1) { - RAY_LOG(INFO) - << "Local scheduler is not connected to a object store manager"; - return RayConfig::instance().local_scheduler_fetch_timeout_milliseconds(); - } - - std::vector object_id_vec; - for (auto const &entry : state->algorithm_state->remote_objects) { - if (entry.second.request_transfer) { - object_id_vec.push_back(entry.first); - } - } - - ObjectID *object_ids = object_id_vec.data(); - int64_t num_object_ids = object_id_vec.size(); - - /* Divide very large fetch requests into smaller fetch requests so that a - * single fetch request doesn't block the plasma manager for a long time. */ - for (int64_t j = 0; j < num_object_ids; - j += RayConfig::instance().local_scheduler_fetch_request_size()) { - int num_objects_in_request = - std::min( - num_object_ids, - j + RayConfig::instance().local_scheduler_fetch_request_size()) - - j; - auto arrow_status = state->plasma_conn->Fetch( - num_objects_in_request, - reinterpret_cast(&object_ids[j])); - if (!arrow_status.ok()) { - LocalSchedulerState_free(state); - RAY_LOG(FATAL) << "Lost connection to the plasma manager, local " - << "scheduler is exiting. Error: " - << arrow_status.ToString(); - } - } - - /* Print a warning if this method took too long. */ - int64_t end_time = current_time_ms(); - if (end_time - start_time > - RayConfig::instance().max_time_for_handler_milliseconds()) { - RAY_LOG(WARNING) << "fetch_object_timeout_handler took " - << end_time - start_time << " milliseconds."; - } - - /* Wait at least local_scheduler_fetch_timeout_milliseconds before running - * this timeout handler again. But if we're waiting for a large number of - * objects, wait longer (e.g., 10 seconds for one million objects) so that we - * don't overwhelm the plasma manager. */ - return std::max( - RayConfig::instance().local_scheduler_fetch_timeout_milliseconds(), - int64_t(0.01 * num_object_ids)); -} - -/* TODO(swang): This method is not covered by any valgrind tests. 
*/ -int reconstruct_object_timeout_handler(event_loop *loop, - timer_id id, - void *context) { - int64_t start_time = current_time_ms(); - - LocalSchedulerState *state = (LocalSchedulerState *) context; - - /* This vector is used to track which object IDs to reconstruct next. If the - * vector is empty, we repopulate it with all of the keys of the remote object - * table. During every pass through this handler, we call reconstruct on up to - * max_num_to_reconstruct elements of the vector (after first checking that - * the object IDs are still missing). */ - static std::vector object_ids_to_reconstruct; - - /* If the set is empty, repopulate it. */ - if (object_ids_to_reconstruct.size() == 0) { - for (auto const &entry : state->algorithm_state->remote_objects) { - object_ids_to_reconstruct.push_back(entry.first); - } - } - - int64_t num_reconstructed = 0; - for (size_t i = 0; i < object_ids_to_reconstruct.size(); i++) { - ObjectID object_id = object_ids_to_reconstruct[i]; - /* Only call reconstruct if we are still missing the object. */ - if (state->algorithm_state->remote_objects.find(object_id) != - state->algorithm_state->remote_objects.end()) { - reconstruct_object(state, object_id); - } - num_reconstructed++; - if (num_reconstructed == RayConfig::instance().max_num_to_reconstruct()) { - break; - } - } - object_ids_to_reconstruct.erase( - object_ids_to_reconstruct.begin(), - object_ids_to_reconstruct.begin() + num_reconstructed); - - /* Print a warning if this method took too long. */ - int64_t end_time = current_time_ms(); - if (end_time - start_time > - RayConfig::instance().max_time_for_handler_milliseconds()) { - RAY_LOG(WARNING) << "reconstruct_object_timeout_handler took " - << end_time - start_time << " milliseconds."; - } - - return RayConfig::instance() - .local_scheduler_reconstruction_timeout_milliseconds(); -} - -int rerun_actor_creation_tasks_timeout_handler(event_loop *loop, - timer_id id, - void *context) { - int64_t start_time = current_time_ms(); - - LocalSchedulerState *state = (LocalSchedulerState *) context; - - // Create a set of the dummy object IDs for the actor creation tasks to - // reconstruct. - std::unordered_set actor_dummy_objects; - for (auto const &execution_spec : - state->algorithm_state->cached_submitted_actor_tasks) { - ObjectID actor_creation_dummy_object_id = - TaskSpec_actor_creation_dummy_object_id(execution_spec.Spec()); - actor_dummy_objects.insert(actor_creation_dummy_object_id); - } - - // Issue reconstruct calls. - for (auto const &object_id : actor_dummy_objects) { - reconstruct_object(state, object_id); - } - - // Print a warning if this method took too long. - int64_t end_time = current_time_ms(); - if (end_time - start_time > - RayConfig::instance().max_time_for_handler_milliseconds()) { - RAY_LOG(WARNING) << "reconstruct_object_timeout_handler took " - << end_time - start_time << " milliseconds."; - } - - return RayConfig::instance() - .local_scheduler_reconstruction_timeout_milliseconds(); -} - -/** - * Return true if there are still some resources available and false otherwise. - * - * @param state The scheduler state. - * @return True if there are still some resources and false if there are not. 
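The fetch timeout handler above splits a large set of missing object IDs into bounded fetch requests so that no single call occupies the plasma manager for too long. Below is a minimal sketch of that batching pattern; the Fetch() stub and the fixed batch size are assumptions standing in for the real manager call and for local_scheduler_fetch_request_size.

#include <algorithm>
#include <cstddef>
#include <iostream>
#include <string>
#include <vector>

constexpr std::size_t kFetchRequestSize = 4;  // stand-in for the config value

// Stand-in for a plasma-manager fetch call.
void Fetch(const std::string *ids, std::size_t count) {
  std::cout << "fetch request for " << count << " objects\n";
}

// Divide a large fetch into smaller requests of at most kFetchRequestSize IDs.
void FetchInBatches(const std::vector<std::string> &missing) {
  for (std::size_t i = 0; i < missing.size(); i += kFetchRequestSize) {
    std::size_t batch = std::min(kFetchRequestSize, missing.size() - i);
    Fetch(missing.data() + i, batch);
  }
}

int main() {
  std::vector<std::string> missing(10, "obj");
  FetchInBatches(missing);  // issues requests of size 4, 4, 2
}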
- */ -bool resources_available(LocalSchedulerState *state) { - bool resources_available = false; - for (auto const &resource_pair : state->dynamic_resources) { - if (resource_pair.second > 0) { - resources_available = true; - } - } - return resources_available; -} - -void spillback_tasks_handler(LocalSchedulerState *state) { - SchedulingAlgorithmState *algorithm_state = state->algorithm_state; - - int64_t num_to_spillback = std::min( - static_cast(algorithm_state->dispatch_task_queue->size()), - RayConfig::instance().max_tasks_to_spillback()); - - auto it = algorithm_state->dispatch_task_queue->end(); - for (int64_t i = 0; i < num_to_spillback; i++) { - it--; - } - - for (int64_t i = 0; i < num_to_spillback; i++) { - it->IncrementSpillbackCount(); - // If an actor hasn't been created for a while, push a warning to the - // driver. - if (it->SpillbackCount() % - RayConfig::instance().actor_creation_num_spillbacks_warning() == - 0) { - TaskSpec *spec = it->Spec(); - if (TaskSpec_is_actor_creation_task(spec)) { - std::ostringstream error_message; - error_message << "The actor with ID " - << TaskSpec_actor_creation_id(spec) << " is taking a " - << "while to be created. It is possible that the " - << "cluster does not have enough resources to place this " - << "actor (this may be normal while an autoscaling " - << "is scaling up). Consider reducing the number of " - << "actors created, or " - << "increasing the number of slots available by using " - << "the --num-cpus, --num-gpus, and --resources flags. " - << "The actor creation task is requesting "; - for (auto const &resource_pair : - TaskSpec_get_required_resources(spec)) { - error_message << resource_pair.second << " " << resource_pair.first - << " "; - } - push_error(state->db, TaskSpec_driver_id(spec), - ErrorIndex::ACTOR_NOT_CREATED, error_message.str()); - } - } - - give_task_to_global_scheduler(state, algorithm_state, *it); - // Dequeue the task. - it = algorithm_state->dispatch_task_queue->erase(it); - } -} - -/** - * Assign as many tasks from the dispatch queue as possible. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @return Void. - */ -void dispatch_tasks(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state) { - /* Assign as many tasks as we can, while there are workers available. */ - for (auto it = algorithm_state->dispatch_task_queue->begin(); - it != algorithm_state->dispatch_task_queue->end();) { - TaskSpec *spec = it->Spec(); - /* If there is a task to assign, but there are no more available workers in - * the worker pool, then exit. Ensure that there will be an available - * worker during a future invocation of dispatch_tasks. */ - if (algorithm_state->available_workers.size() == 0) { - if (state->child_pids.size() == 0) { - /* If there are no workers, including those pending PID registration, - * then we must start a new one to replenish the worker pool. */ - start_worker(state); - } - return; - } - - /* Terminate early if there are no more resources available. */ - if (!resources_available(state)) { - return; - } - - /* Skip to the next task if this task cannot currently be satisfied. */ - if (!check_dynamic_resources(state, - TaskSpec_get_required_resources(spec))) { - /* This task could not be satisfied -- proceed to the next task. */ - ++it; - continue; - } - - /* Dispatch this task to an available worker and dequeue the task. */ - RAY_LOG(DEBUG) << "Dispatching task"; - /* Get the last available worker in the available worker queue. 
*/ - LocalSchedulerClient *worker = algorithm_state->available_workers.back(); - /* Tell the available worker to execute the task. */ - assign_task_to_worker(state, *it, worker); - /* Remove the worker from the available queue, and add it to the executing - * workers. */ - algorithm_state->available_workers.pop_back(); - algorithm_state->executing_workers.push_back(worker); - print_resource_info(state, spec); - /* Dequeue the task. */ - it = algorithm_state->dispatch_task_queue->erase(it); - } /* End for each task in the dispatch queue. */ -} - -/** - * Attempt to dispatch both regular tasks and actor tasks. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @return Void. - */ -void dispatch_all_tasks(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state) { - /* First attempt to dispatch regular tasks. */ - dispatch_tasks(state, algorithm_state); - - /* Attempt to dispatch actor tasks. */ - auto it = algorithm_state->actors_with_pending_tasks.begin(); - while (it != algorithm_state->actors_with_pending_tasks.end()) { - // We cannot short-circuit and exit here if there are no resources - // available because actor methods may require 0 CPUs. - - /* We increment the iterator ahead of time because the call to - * dispatch_actor_task may invalidate the current iterator. */ - ActorID actor_id = *it; - it++; - /* Dispatch tasks for the current actor. */ - dispatch_actor_task(state, algorithm_state, actor_id); - } -} - -/** - * A helper function to allocate a queue entry for a task specification and - * push it onto a generic queue. - * - * @param state The state of the local scheduler. - * @param task_queue A pointer to a task queue. NOTE: Because we are using - * utlist.h, we must pass in a pointer to the queue we want to append - * to. If we passed in the queue itself and the queue was empty, this - * would append the task to a queue that we don't have a reference to. - * @param task_entry A pointer to the task entry to queue. - * @param from_global_scheduler Whether or not the task was from a global - * scheduler. If false, the task was submitted by a worker. - * @return A reference to the entry in the queue that was pushed. - */ -std::list::iterator queue_task( - LocalSchedulerState *state, - std::list *task_queue, - TaskExecutionSpec &task_entry, - bool from_global_scheduler) { - /* The task has been added to a local scheduler queue. Write the entry in the - * task table to notify others that we have queued it. */ - if (state->db != NULL) { - Task *task = - Task_alloc(task_entry, TaskStatus::QUEUED, get_db_client_id(state->db)); - if (from_global_scheduler) { - /* If the task is from the global scheduler, it's already been added to - * the task table, so just update the entry. */ - task_table_update(state->db, task, NULL, NULL, NULL); - } else { - /* Otherwise, this is the first time the task has been seen in the system - * (unless it's a resubmission of a previous task), so add the entry. */ - task_table_add_task(state->db, task, NULL, NULL, NULL); - } - } - - /* Copy the spec and add it to the task queue. The allocated spec will be - * freed when it is assigned to a worker. */ - TaskExecutionSpec copy = TaskExecutionSpec(&task_entry); - task_queue->push_back(std::move(copy)); - /* Since we just queued the task, we can get a reference to it by going to - * the last element in the queue. */ - auto it = task_queue->end(); - --it; - - return it; -} - -/** - * Queue a task whose dependencies are missing. 
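A compact sketch of the dispatch loop just shown: walk the dispatch queue while workers remain, stop when no workers or resources are left, skip tasks whose resource demand cannot currently be met, and otherwise hand the task to a worker and dequeue it. The Task struct and the single CPU resource are simplifying assumptions for illustration.

#include <iostream>
#include <list>
#include <string>
#include <vector>

struct Task {
  std::string name;
  double cpus_required;
};

int main() {
  std::list<Task> dispatch_queue = {{"a", 1.0}, {"b", 4.0}, {"c", 1.0}};
  std::vector<std::string> available_workers = {"w1", "w2"};
  double cpus_available = 2.0;

  for (auto it = dispatch_queue.begin(); it != dispatch_queue.end();) {
    if (available_workers.empty() || cpus_available <= 0.0) {
      break;  // nothing left to assign tasks to
    }
    if (it->cpus_required > cpus_available) {
      ++it;  // cannot satisfy this task right now; try the next one
      continue;
    }
    // Assign the task to the last available worker and dequeue it.
    std::cout << it->name << " -> " << available_workers.back() << "\n";
    cpus_available -= it->cpus_required;
    available_workers.pop_back();
    it = dispatch_queue.erase(it);
  }
}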
When the task's object - * dependencies become available, the task will be moved to the dispatch queue. - * If we have a connection to a plasma manager, begin trying to fetch the - * dependencies. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @param spec The task specification to queue. - * @param from_global_scheduler Whether or not the task was from a global - * scheduler. If false, the task was submitted by a worker. - * @return Void. - */ -void queue_waiting_task(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec, - bool from_global_scheduler) { - /* For actor tasks, do not queue tasks that have already been executed. */ - auto spec = execution_spec.Spec(); - if (!TaskSpec_actor_id(spec).is_nil()) { - auto entry = - algorithm_state->local_actor_infos.find(TaskSpec_actor_id(spec)); - if (entry != algorithm_state->local_actor_infos.end()) { - /* Find the highest task counter with the same handle ID as the task to - * queue. */ - auto &task_counters = entry->second.task_counters; - auto task_counter = task_counters.find(TaskSpec_actor_handle_id(spec)); - if (task_counter != task_counters.end() && - TaskSpec_actor_counter(spec) < task_counter->second) { - /* If the task to queue has a lower task counter, do not queue it. */ - RAY_LOG(INFO) << "A task that has already been executed has been " - << "resubmitted, so we are ignoring it. This should only " - << "happen during reconstruction."; - return; - } - } - } - - RAY_LOG(DEBUG) << "Queueing task in waiting queue"; - auto it = queue_task(state, algorithm_state->waiting_task_queue, - execution_spec, from_global_scheduler); - fetch_missing_dependencies(state, algorithm_state, it); -} - -/** - * Queue a task whose dependencies are ready. When the task reaches the front - * of the dispatch queue and workers are available, it will be assigned. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @param spec The task specification to queue. - * @param from_global_scheduler Whether or not the task was from a global - * scheduler. If false, the task was submitted by a worker. - * @return Void. - */ -void queue_dispatch_task(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec, - bool from_global_scheduler) { - RAY_LOG(DEBUG) << "Queueing task in dispatch queue"; - TaskSpec *spec = execution_spec.Spec(); - if (TaskSpec_is_actor_task(spec)) { - queue_actor_task(state, algorithm_state, execution_spec, - from_global_scheduler); - } else { - queue_task(state, algorithm_state->dispatch_task_queue, execution_spec, - from_global_scheduler); - } -} - -/** - * Add the task to the proper local scheduler queue. This assumes that the - * scheduling decision to place the task on this node has already been made, - * whether locally or by the global scheduler. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @param spec The task specification to queue. - * @param from_global_scheduler Whether or not the task was from a global - * scheduler. If false, the task was submitted by a worker. - * @return Void. 
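The routing decision documented here (waiting queue versus dispatch queue, depending on whether every dependency is already local) can be illustrated with a small standalone sketch. The Task type and CanRun helper below are stand-ins, not the removed code's API.

#include <initializer_list>
#include <iostream>
#include <list>
#include <string>
#include <unordered_set>
#include <vector>

struct Task {
  std::string name;
  std::vector<std::string> dependencies;
};

bool CanRun(const Task &task, const std::unordered_set<std::string> &local) {
  for (const auto &dep : task.dependencies) {
    if (local.count(dep) == 0) return false;  // a dependency is not local yet
  }
  return true;
}

int main() {
  std::unordered_set<std::string> local_objects = {"obj-1"};
  std::list<Task> waiting_queue, dispatch_queue;

  for (const Task &task : {Task{"t1", {"obj-1"}}, Task{"t2", {"obj-2"}}}) {
    if (CanRun(task, local_objects)) {
      dispatch_queue.push_back(task);  // ready to be assigned to a worker
    } else {
      waiting_queue.push_back(task);   // wait (and fetch) missing dependencies
    }
  }
  std::cout << dispatch_queue.size() << " ready, "
            << waiting_queue.size() << " waiting\n";  // 1 ready, 1 waiting
}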
- */ -void queue_task_locally(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec, - bool from_global_scheduler) { - if (can_run(algorithm_state, execution_spec)) { - /* Dependencies are ready, so push the task to the dispatch queue. */ - queue_dispatch_task(state, algorithm_state, execution_spec, - from_global_scheduler); - } else { - /* Dependencies are not ready, so push the task to the waiting queue. */ - queue_waiting_task(state, algorithm_state, execution_spec, - from_global_scheduler); - } -} - -void give_task_to_local_scheduler_retry(UniqueID id, - void *user_context, - void *user_data) { - LocalSchedulerState *state = (LocalSchedulerState *) user_context; - Task *task = (Task *) user_data; - RAY_CHECK(Task_state(task) == TaskStatus::SCHEDULED); - - TaskExecutionSpec *execution_spec = Task_task_execution_spec(task); - TaskSpec *spec = execution_spec->Spec(); - RAY_CHECK(TaskSpec_is_actor_task(spec)); - - ActorID actor_id = TaskSpec_actor_id(spec); - - if (state->actor_mapping.count(actor_id) == 0) { - // Process the actor task submission again. This will cache the task - // locally until a new actor creation notification is broadcast. We will - // attempt to reissue the actor creation tasks for all cached actor tasks - // in rerun_actor_creation_tasks_timeout_handler. - handle_actor_task_submitted(state, state->algorithm_state, *execution_spec); - return; - } - - DBClientID remote_local_scheduler_id = - state->actor_mapping[actor_id].local_scheduler_id; - - // TODO(rkn): db_client_table_cache_get is a blocking call, is this a - // performance issue? - DBClient remote_local_scheduler = - db_client_table_cache_get(state->db, remote_local_scheduler_id); - - // Check if the local scheduler that we're assigning this task to is still - // alive. - if (remote_local_scheduler.is_alive) { - // The local scheduler is still alive, which means that perhaps it hasn't - // subscribed to the appropriate channel yet, so retrying should suffice. - // This should be rare. - give_task_to_local_scheduler( - state, state->algorithm_state, *execution_spec, - state->actor_mapping[actor_id].local_scheduler_id); - } else { - // The local scheduler is dead, so we will need to recreate the actor by - // invoking reconstruction. - RAY_LOG(INFO) << "Local scheduler " << remote_local_scheduler_id - << " that was running actor " << actor_id << " died."; - RAY_CHECK(state->actor_mapping.count(actor_id) == 1); - // Update the actor mapping. - state->actor_mapping.erase(actor_id); - // Process the actor task submission again. This will cache the task - // locally until a new actor creation notification is broadcast. We will - // attempt to reissue the actor creation tasks for all cached actor tasks - // in rerun_actor_creation_tasks_timeout_handler. - handle_actor_task_submitted(state, state->algorithm_state, *execution_spec); - } -} - -/** - * Give a task directly to another local scheduler. This is currently only used - * for assigning actor tasks to the local scheduler responsible for that actor. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @param spec The task specification to schedule. - * @param local_scheduler_id The ID of the local scheduler to give the task to. - * @return Void. 
- */ -void give_task_to_local_scheduler(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec, - DBClientID local_scheduler_id) { - if (local_scheduler_id == get_db_client_id(state->db)) { - RAY_LOG(WARNING) << "Local scheduler is trying to assign a task to itself."; - } - RAY_CHECK(state->db != NULL); - /* Assign the task to the relevant local scheduler. */ - RAY_CHECK(state->config.global_scheduler_exists); - Task *task = - Task_alloc(execution_spec, TaskStatus::SCHEDULED, local_scheduler_id); - auto retryInfo = RetryInfo{ - .num_retries = 0, // This value is unused. - .timeout = 0, // This value is unused. - .fail_callback = give_task_to_local_scheduler_retry, - }; - - task_table_add_task(state->db, task, &retryInfo, NULL, state); -} - -void give_task_to_global_scheduler_retry(UniqueID id, - void *user_context, - void *user_data) { - LocalSchedulerState *state = (LocalSchedulerState *) user_context; - Task *task = (Task *) user_data; - RAY_CHECK(Task_state(task) == TaskStatus::WAITING); - - TaskExecutionSpec *execution_spec = Task_task_execution_spec(task); - TaskSpec *spec = execution_spec->Spec(); - RAY_CHECK(!TaskSpec_is_actor_task(spec)); - - give_task_to_global_scheduler(state, state->algorithm_state, *execution_spec); -} - -/** - * Give a task to the global scheduler to schedule. - * - * @param state The scheduler state. - * @param algorithm_state The scheduling algorithm state. - * @param spec The task specification to schedule. - * @return Void. - */ -void give_task_to_global_scheduler(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec) { - if (state->db == NULL || !state->config.global_scheduler_exists) { - /* A global scheduler is not available, so queue the task locally. */ - queue_task_locally(state, algorithm_state, execution_spec, false); - return; - } - /* Pass on the task to the global scheduler. */ - RAY_CHECK(state->config.global_scheduler_exists); - Task *task = Task_alloc(execution_spec, TaskStatus::WAITING, - get_db_client_id(state->db)); - RAY_CHECK(state->db != NULL); - auto retryInfo = RetryInfo{ - .num_retries = 0, // This value is unused. - .timeout = 0, // This value is unused. - .fail_callback = give_task_to_global_scheduler_retry, - }; - task_table_add_task(state->db, task, &retryInfo, NULL, state); -} - -bool resource_constraints_satisfied(LocalSchedulerState *state, - TaskSpec *spec) { - /* At the local scheduler, if required resource vector exceeds either static - * or dynamic resource vector, the resource constraint is not satisfied. */ - for (auto const &resource_pair : TaskSpec_get_required_resources(spec)) { - double required_resource = resource_pair.second; - if (required_resource > state->static_resources[resource_pair.first] || - required_resource > state->dynamic_resources[resource_pair.first]) { - return false; - } - } - - if (TaskSpec_is_actor_creation_task(spec) && - state->static_resources["CPU"] != 0) { - return false; - } - - return true; -} - -void handle_task_submitted(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec) { - TaskSpec *spec = execution_spec.Spec(); - /* TODO(atumanov): if static is satisfied and local objects ready, but dynamic - * resource is currently unavailable, then consider queueing task locally and - * recheck dynamic next time. 
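As a hedged illustration of the feasibility test in resource_constraints_satisfied above, the sketch below checks a task's resource demand against both the node's total (static) and currently free (dynamic) resources, using plain maps in place of the real resource vectors; an absent entry is treated as unavailable.

#include <iostream>
#include <string>
#include <unordered_map>

using ResourceMap = std::unordered_map<std::string, double>;

bool ConstraintsSatisfied(const ResourceMap &required,
                          const ResourceMap &static_resources,
                          const ResourceMap &dynamic_resources) {
  for (const auto &pair : required) {
    auto total = static_resources.find(pair.first);
    auto free_now = dynamic_resources.find(pair.first);
    if (total == static_resources.end() ||
        free_now == dynamic_resources.end() ||
        pair.second > total->second || pair.second > free_now->second) {
      return false;  // the node cannot (currently) provide this resource
    }
  }
  return true;
}

int main() {
  ResourceMap total = {{"CPU", 4}, {"GPU", 1}};
  ResourceMap free_now = {{"CPU", 2}, {"GPU", 0}};
  std::cout << ConstraintsSatisfied({{"CPU", 2}}, total, free_now) << "\n";  // 1
  std::cout << ConstraintsSatisfied({{"GPU", 1}}, total, free_now) << "\n";  // 0
}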
*/ - - // If this task's constraints are satisfied, dependencies are available - // locally, and there is an available worker, then enqueue the task in the - // dispatch queue and trigger task dispatch. Otherwise, pass the task along to - // the global scheduler if there is one. - // Note that actor creation tasks automatically go to the global scheduler. - // See https://github.com/ray-project/ray/issues/1756 for more discussion. - // This is a hack to improve actor load balancing (and to prevent the scenario - // where all actors are started locally). - if (resource_constraints_satisfied(state, spec) && - (algorithm_state->available_workers.size() > 0) && - can_run(algorithm_state, execution_spec) && - !TaskSpec_is_actor_creation_task(spec)) { - queue_dispatch_task(state, algorithm_state, execution_spec, false); - } else { - /* Give the task to the global scheduler to schedule, if it exists. */ - give_task_to_global_scheduler(state, algorithm_state, execution_spec); - } - - /* Try to dispatch tasks, since we may have added one to the queue. */ - dispatch_tasks(state, algorithm_state); -} - -void handle_actor_task_submitted(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec) { - TaskSpec *task_spec = execution_spec.Spec(); - RAY_CHECK(TaskSpec_is_actor_task(task_spec)); - ActorID actor_id = TaskSpec_actor_id(task_spec); - - if (state->actor_mapping.count(actor_id) == 0) { - // Create a copy of the task to write to the task table. - Task *task = Task_alloc( - task_spec, execution_spec.SpecSize(), TaskStatus::ACTOR_CACHED, - get_db_client_id(state->db), execution_spec.ExecutionDependencies()); - - /* Add this task to a queue of tasks that have been submitted but the local - * scheduler doesn't know which actor is responsible for them. These tasks - * will be resubmitted (internally by the local scheduler) whenever a new - * actor notification arrives. NOTE(swang): These tasks have not yet been - * added to the task table. */ - TaskExecutionSpec task_entry = TaskExecutionSpec(&execution_spec); - algorithm_state->cached_submitted_actor_tasks.push_back( - std::move(task_entry)); - - // Even if the task can't be assigned to a worker yet, we should still write - // it to the task table. TODO(rkn): There's no need to do this more than - // once, and we could run into problems if we have very large numbers of - // tasks in this cache. - task_table_add_task(state->db, task, NULL, NULL, NULL); - - return; - } - - if (state->actor_mapping[actor_id].local_scheduler_id == - get_db_client_id(state->db)) { - /* This local scheduler is responsible for the actor, so handle the task - * locally. */ - queue_task_locally(state, algorithm_state, execution_spec, false); - /* Attempt to dispatch tasks to this actor. */ - dispatch_actor_task(state, algorithm_state, actor_id); - } else { - /* This local scheduler is not responsible for the task, so find the local - * scheduler that is responsible for this actor and assign the task directly - * to that local scheduler. 
*/ - give_task_to_local_scheduler( - state, algorithm_state, execution_spec, - state->actor_mapping[actor_id].local_scheduler_id); - } -} - -void handle_actor_creation_notification( - LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id) { - int num_cached_actor_tasks = - algorithm_state->cached_submitted_actor_tasks.size(); - - for (int i = 0; i < num_cached_actor_tasks; ++i) { - TaskExecutionSpec &task = algorithm_state->cached_submitted_actor_tasks[i]; - /* Note that handle_actor_task_submitted may append the spec to the end of - * the cached_submitted_actor_tasks array. */ - handle_actor_task_submitted(state, algorithm_state, task); - } - /* Remove all the tasks that were resubmitted. This does not erase the tasks - * that were newly appended to the cached_submitted_actor_tasks array. */ - auto begin = algorithm_state->cached_submitted_actor_tasks.begin(); - algorithm_state->cached_submitted_actor_tasks.erase( - begin, begin + num_cached_actor_tasks); -} - -void handle_task_scheduled(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec) { - /* This callback handles tasks that were assigned to this local scheduler by - * the global scheduler, so we can safely assert that there is a connection to - * the database. */ - RAY_CHECK(state->db != NULL); - RAY_CHECK(state->config.global_scheduler_exists); - - // Currently, the global scheduler will never assign a task to a local - // scheduler that has 0 CPUs. - RAY_CHECK(state->static_resources["CPU"] != 0); - - // Push the task to the appropriate queue. - queue_task_locally(state, algorithm_state, execution_spec, true); - dispatch_tasks(state, algorithm_state); -} - -void handle_actor_task_scheduled(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec) { - TaskSpec *spec = execution_spec.Spec(); - /* This callback handles tasks that were assigned to this local scheduler by - * the global scheduler or by other workers, so we can safely assert that - * there is a connection to the database. */ - RAY_CHECK(state->db != NULL); - RAY_CHECK(state->config.global_scheduler_exists); - /* Check that the task is meant to run on an actor that this local scheduler - * is responsible for. */ - RAY_CHECK(TaskSpec_is_actor_task(spec)); - ActorID actor_id = TaskSpec_actor_id(spec); - if (state->actor_mapping.count(actor_id) == 1) { - RAY_CHECK(state->actor_mapping[actor_id].local_scheduler_id == - get_db_client_id(state->db)); - } else { - /* This means that an actor has been assigned to this local scheduler, and a - * task for that actor has been received by this local scheduler, but this - * local scheduler has not yet processed the notification about the actor - * creation. This may be possible though should be very uncommon. If it does - * happen, it's ok. */ - RAY_LOG(INFO) << "handle_actor_task_scheduled called on local scheduler " - << "but the corresponding actor_map_entry is not present. " - << "This should be rare."; - } - /* Push the task to the appropriate queue. */ - queue_task_locally(state, algorithm_state, execution_spec, true); - dispatch_actor_task(state, algorithm_state, actor_id); -} - -void handle_worker_available(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker) { - RAY_CHECK(worker->task_in_progress == NULL); - /* Check that the worker isn't in the pool of available workers. 
*/ - RAY_CHECK(!worker_in_vector(algorithm_state->available_workers, worker)); - - /* Check that the worker isn't in the list of blocked workers. */ - RAY_CHECK(!worker_in_vector(algorithm_state->blocked_workers, worker)); - - /* If the worker was executing a task, it must have finished, so remove it - * from the list of executing workers. If the worker is connecting for the - * first time, it will not be in the list of executing workers. */ - remove_worker_from_vector(algorithm_state->executing_workers, worker); - /* Double check that we successfully removed the worker. */ - RAY_CHECK(!worker_in_vector(algorithm_state->executing_workers, worker)); - - /* Add worker to the list of available workers. */ - algorithm_state->available_workers.push_back(worker); - - /* Try to dispatch tasks. */ - dispatch_all_tasks(state, algorithm_state); -} - -void handle_worker_removed(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker) { - /* Make sure this is not an actor. */ - RAY_CHECK(worker->actor_id.is_nil()); - - /* Make sure that we remove the worker at most once. */ - int num_times_removed = 0; - - /* Remove the worker from available workers, if it's there. */ - bool removed_from_available = - remove_worker_from_vector(algorithm_state->available_workers, worker); - num_times_removed += removed_from_available; - /* Double check that we actually removed the worker. */ - RAY_CHECK(!worker_in_vector(algorithm_state->available_workers, worker)); - - /* Remove the worker from executing workers, if it's there. */ - bool removed_from_executing = - remove_worker_from_vector(algorithm_state->executing_workers, worker); - num_times_removed += removed_from_executing; - /* Double check that we actually removed the worker. */ - RAY_CHECK(!worker_in_vector(algorithm_state->executing_workers, worker)); - - /* Remove the worker from blocked workers, if it's there. */ - bool removed_from_blocked = - remove_worker_from_vector(algorithm_state->blocked_workers, worker); - num_times_removed += removed_from_blocked; - /* Double check that we actually removed the worker. */ - RAY_CHECK(!worker_in_vector(algorithm_state->blocked_workers, worker)); - - /* Make sure we removed the worker at most once. */ - RAY_CHECK(num_times_removed <= 1); - - /* Attempt to dispatch some tasks because some resources may have freed up. */ - dispatch_all_tasks(state, algorithm_state); -} - -void handle_actor_worker_disconnect(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker, - bool cleanup) { - /* Fail all in progress or queued tasks of the actor. */ - if (!cleanup) { - if (state->db != NULL) { - actor_table_mark_removed(state->db, worker->actor_id); - } - - if (worker->task_in_progress != NULL) { - finish_killed_task(state, - *Task_task_execution_spec(worker->task_in_progress)); - } - - state->removed_actors.insert(worker->actor_id); - - RAY_CHECK(algorithm_state->local_actor_infos.count(worker->actor_id) != 0); - LocalActorInfo &entry = - algorithm_state->local_actor_infos.find(worker->actor_id)->second; - for (auto &task : *entry.task_queue) { - finish_killed_task(state, task); - } - } - - remove_actor(algorithm_state, worker->actor_id); - - /* Attempt to dispatch some tasks because some resources may have freed up. */ - dispatch_all_tasks(state, algorithm_state); - - /* Start a worker to replace the removed actor's worker and replenish the - * worker pool. 
*/ - start_worker(state); -} - -/* NOTE(swang): For tasks that saved a checkpoint, we should consider - * overwriting the result table entries for the current task frontier to - * avoid duplicate task submissions during reconstruction. */ -void handle_actor_worker_available(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker) { - ActorID actor_id = worker->actor_id; - RAY_CHECK(!actor_id.is_nil()); - /* Get the actor info for this worker. */ - RAY_CHECK(algorithm_state->local_actor_infos.count(actor_id) == 1); - LocalActorInfo &entry = - algorithm_state->local_actor_infos.find(actor_id)->second; - RAY_CHECK(worker == entry.worker); - RAY_CHECK(!entry.worker_available); - /* If an actor task was assigned, mark returned dummy object as locally - * available. This is not added to the object table, so the update will be - * invisible to other nodes. */ - /* NOTE(swang): These objects are never cleaned up. We should consider - * removing the objects, e.g., when an actor is terminated. */ - if (!entry.execution_dependency.is_nil()) { - handle_object_available(state, algorithm_state, entry.execution_dependency); - } - /* Unset the fields indicating an assigned task. */ - entry.worker_available = true; - /* Assign new tasks if possible. */ - dispatch_all_tasks(state, algorithm_state); -} - -void handle_worker_blocked(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker) { - /* Find the worker in the list of executing workers. */ - RAY_CHECK( - remove_worker_from_vector(algorithm_state->executing_workers, worker)); - - /* Check that the worker isn't in the list of blocked workers. */ - RAY_CHECK(!worker_in_vector(algorithm_state->blocked_workers, worker)); - - /* Add the worker to the list of blocked workers. */ - algorithm_state->blocked_workers.push_back(worker); - - /* Try to dispatch tasks, since we may have freed up some resources. */ - dispatch_all_tasks(state, algorithm_state); -} - -void handle_actor_worker_blocked(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker) { - /* The actor case doesn't use equivalents of the blocked_workers and - * executing_workers lists. Are these necessary? */ - /* Try to dispatch tasks, since we may have freed up some resources. */ - dispatch_all_tasks(state, algorithm_state); -} - -void handle_worker_unblocked(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker) { - /* Find the worker in the list of blocked workers. */ - RAY_CHECK( - remove_worker_from_vector(algorithm_state->blocked_workers, worker)); - - /* Check that the worker isn't in the list of executing workers. */ - RAY_CHECK(!worker_in_vector(algorithm_state->executing_workers, worker)); - - /* Add the worker to the list of executing workers. */ - algorithm_state->executing_workers.push_back(worker); -} - -void handle_actor_worker_unblocked(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker) {} - -void handle_object_available(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - ObjectID object_id) { - auto object_entry_it = algorithm_state->remote_objects.find(object_id); - - ObjectEntry entry; - /* Get the entry for this object from the active fetch request, or allocate - * one if needed. */ - if (object_entry_it != algorithm_state->remote_objects.end()) { - /* Remove the object from the active fetch requests. 
*/ - entry = object_entry_it->second; - algorithm_state->remote_objects.erase(object_id); - } - - /* Add the entry to the set of locally available objects. */ - RAY_CHECK(algorithm_state->local_objects.count(object_id) == 0); - algorithm_state->local_objects[object_id] = entry; - - if (!entry.dependent_tasks.empty()) { - /* Out of the tasks that were dependent on this object, if they are now - * ready to run, move them to the dispatch queue. */ - for (auto &it : entry.dependent_tasks) { - if (can_run(algorithm_state, *it)) { - if (TaskSpec_is_actor_task(it->Spec())) { - insert_actor_task_queue(state, algorithm_state, std::move(*it)); - } else { - algorithm_state->dispatch_task_queue->push_back(std::move(*it)); - } - /* Remove the entry with a matching TaskSpec pointer from the waiting - * queue, but do not free the task spec. */ - algorithm_state->waiting_task_queue->erase(it); - } - } - /* Try to dispatch tasks, since we may have added some from the waiting - * queue. */ - dispatch_all_tasks(state, algorithm_state); - /* Clean up the records for dependent tasks. */ - entry.dependent_tasks.clear(); - } -} - -void handle_object_removed(LocalSchedulerState *state, - ObjectID removed_object_id) { - /* Remove the object from the set of locally available objects. */ - SchedulingAlgorithmState *algorithm_state = state->algorithm_state; - - RAY_CHECK(algorithm_state->local_objects.count(removed_object_id) == 1); - algorithm_state->local_objects.erase(removed_object_id); - - /* Track queued tasks that were dependent on this object. - * NOTE: Since objects often get removed in batches (e.g., during eviction), - * we may end up iterating through the queues many times in a row. If this - * turns out to be a bottleneck, consider tracking dependencies even for - * tasks in the dispatch queue, or batching object notifications. */ - /* Track the dependency for tasks that were in the dispatch queue. Remove - * these tasks from the dispatch queue and push them to the waiting queue. */ - for (auto it = algorithm_state->dispatch_task_queue->begin(); - it != algorithm_state->dispatch_task_queue->end();) { - if (it->DependsOn(removed_object_id)) { - /* This task was dependent on the removed object. */ - RAY_LOG(DEBUG) << "Moved task from dispatch queue back to waiting queue"; - algorithm_state->waiting_task_queue->push_back(std::move(*it)); - /* Remove the task from the dispatch queue, but do not free the task - * spec. */ - it = algorithm_state->dispatch_task_queue->erase(it); - } else { - /* The task can still run, so continue to the next task. */ - ++it; - } - } - - std::vector empty_actor_queues; - for (auto it = algorithm_state->actors_with_pending_tasks.begin(); - it != algorithm_state->actors_with_pending_tasks.end(); it++) { - auto actor_info = algorithm_state->local_actor_infos[*it]; - for (auto queue_it = actor_info.task_queue->begin(); - queue_it != actor_info.task_queue->end();) { - if (queue_it->DependsOn(removed_object_id)) { - /* This task was dependent on the removed object. */ - RAY_LOG(DEBUG) << "Moved task from actor dispatch queue back to " - << "waiting queue"; - algorithm_state->waiting_task_queue->push_back(std::move(*queue_it)); - /* Remove the task from the dispatch queue, but do not free the task - * spec. 
*/ - queue_it = actor_info.task_queue->erase(queue_it); - if (actor_info.task_queue->size() == 0) { - empty_actor_queues.push_back(*it); - } - } else { - ++queue_it; - } - } - } - for (auto actor_id : empty_actor_queues) { - algorithm_state->actors_with_pending_tasks.erase(actor_id); - } - - /* Track the dependency for tasks that are in the waiting queue, including - * those that were just moved from the dispatch queue. */ - for (auto it = algorithm_state->waiting_task_queue->begin(); - it != algorithm_state->waiting_task_queue->end(); ++it) { - int64_t num_dependencies = it->NumDependencies(); - for (int64_t i = 0; i < num_dependencies; ++i) { - int count = it->DependencyIdCount(i); - for (int j = 0; j < count; ++j) { - ObjectID dependency_id = it->DependencyId(i, j); - if (dependency_id == removed_object_id) { - /* Do not request a transfer from other plasma managers if this is an - * execution dependency. */ - bool request_transfer = it->IsStaticDependency(i); - fetch_missing_dependency(state, algorithm_state, it, - removed_object_id.to_plasma_id(), - request_transfer); - } - } - } - } -} - -void handle_driver_removed(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - WorkerID driver_id) { - /* Loop over fetch requests. This must be done before we clean up the waiting - * task queue and the dispatch task queue because this map contains iterators - * for those lists, which will be invalidated when we clean up those lists.*/ - for (auto it = algorithm_state->remote_objects.begin(); - it != algorithm_state->remote_objects.end();) { - /* Loop over the tasks that are waiting for this object and remove the tasks - * for the removed driver. */ - auto task_it_it = it->second.dependent_tasks.begin(); - while (task_it_it != it->second.dependent_tasks.end()) { - /* If the dependent task was a task for the removed driver, remove it from - * this vector. */ - TaskSpec *spec = (*task_it_it)->Spec(); - if (TaskSpec_driver_id(spec) == driver_id) { - task_it_it = it->second.dependent_tasks.erase(task_it_it); - } else { - task_it_it++; - } - } - /* If there are no more dependent tasks for this object, then remove the - * ObjectEntry. */ - if (it->second.dependent_tasks.size() == 0) { - it = algorithm_state->remote_objects.erase(it); - } else { - it++; - } - } - - /* Remove this driver's tasks from the waiting task queue. */ - auto it = algorithm_state->waiting_task_queue->begin(); - while (it != algorithm_state->waiting_task_queue->end()) { - TaskSpec *spec = it->Spec(); - if (TaskSpec_driver_id(spec) == driver_id) { - it = algorithm_state->waiting_task_queue->erase(it); - } else { - it++; - } - } - - /* Remove this driver's tasks from the dispatch task queue. */ - it = algorithm_state->dispatch_task_queue->begin(); - while (it != algorithm_state->dispatch_task_queue->end()) { - TaskSpec *spec = it->Spec(); - if (TaskSpec_driver_id(spec) == driver_id) { - it = algorithm_state->dispatch_task_queue->erase(it); - } else { - it++; - } - } - - // Remove this driver's tasks from the cached actor tasks. Note that this loop - // could be very slow if the vector of cached actor tasks is very long. - for (auto it = algorithm_state->cached_submitted_actor_tasks.begin(); - it != algorithm_state->cached_submitted_actor_tasks.end();) { - TaskSpec *spec = (*it).Spec(); - if (TaskSpec_driver_id(spec) == driver_id) { - it = algorithm_state->cached_submitted_actor_tasks.erase(it); - } else { - ++it; - } - } - - /* TODO(rkn): Should we clean up the actor data structures? 
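The two handlers above move tasks between the waiting and dispatch queues as objects appear in and disappear from the local store. The following simplified sketch shows both transitions; the Task and Queues types and the string IDs are stand-ins rather than the removed data structures.

#include <iostream>
#include <list>
#include <string>
#include <unordered_set>
#include <vector>

struct Task {
  std::string name;
  std::vector<std::string> dependencies;
  bool DependsOn(const std::string &obj) const {
    for (const auto &dep : dependencies) {
      if (dep == obj) return true;
    }
    return false;
  }
};

struct Queues {
  std::unordered_set<std::string> local_objects;
  std::list<Task> waiting, dispatch;

  // An object arrived: waiting tasks whose dependencies are now all local
  // move to the dispatch queue.
  void OnObjectAvailable(const std::string &obj) {
    local_objects.insert(obj);
    for (auto it = waiting.begin(); it != waiting.end();) {
      bool ready = true;
      for (const auto &dep : it->dependencies) {
        if (local_objects.count(dep) == 0) ready = false;
      }
      if (ready) {
        dispatch.push_back(std::move(*it));
        it = waiting.erase(it);  // task is now runnable
      } else {
        ++it;
      }
    }
  }

  // An object was evicted: dispatch-queue tasks that depend on it move back
  // to the waiting queue (where a re-fetch would be issued).
  void OnObjectRemoved(const std::string &obj) {
    local_objects.erase(obj);
    for (auto it = dispatch.begin(); it != dispatch.end();) {
      if (it->DependsOn(obj)) {
        waiting.push_back(std::move(*it));
        it = dispatch.erase(it);
      } else {
        ++it;
      }
    }
  }
};

int main() {
  Queues q;
  q.waiting.push_back({"t1", {"obj-1"}});
  q.OnObjectAvailable("obj-1");
  std::cout << q.dispatch.size() << " dispatchable\n";  // 1 dispatchable
  q.OnObjectRemoved("obj-1");
  std::cout << q.waiting.size() << " waiting again\n";  // 1 waiting again
}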
*/ -} - -int num_waiting_tasks(SchedulingAlgorithmState *algorithm_state) { - return algorithm_state->waiting_task_queue->size(); -} - -int num_dispatch_tasks(SchedulingAlgorithmState *algorithm_state) { - return algorithm_state->dispatch_task_queue->size(); -} - -void print_worker_info(const char *message, - SchedulingAlgorithmState *algorithm_state) { - RAY_LOG(DEBUG) << message << ": " << algorithm_state->available_workers.size() - << " available, " << algorithm_state->executing_workers.size() - << " executing, " << algorithm_state->blocked_workers.size() - << " blocked"; -} - -std::unordered_map get_actor_task_counters( - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id) { - RAY_CHECK(algorithm_state->local_actor_infos.count(actor_id) != 0); - return algorithm_state->local_actor_infos[actor_id].task_counters; -} - -void set_actor_task_counters( - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id, - const std::unordered_map &task_counters) { - RAY_CHECK(algorithm_state->local_actor_infos.count(actor_id) != 0); - /* Overwrite the current task counters for the actor. This is necessary - * during reconstruction when resuming from a checkpoint so that we can - * resume the task frontier at the time that the checkpoint was saved. */ - auto &entry = algorithm_state->local_actor_infos[actor_id]; - entry.task_counters = task_counters; - - /* Filter out tasks for the actor that were submitted earlier than the new - * task counter. These represent tasks that executed before the actor's - * resumed checkpoint, and therefore should not be re-executed. */ - for (auto it = entry.task_queue->begin(); it != entry.task_queue->end();) { - /* Filter out duplicate tasks for the actor that are runnable. */ - TaskSpec *pending_task_spec = it->Spec(); - ActorHandleID handle_id = TaskSpec_actor_handle_id(pending_task_spec); - auto task_counter = entry.task_counters.find(handle_id); - if (task_counter != entry.task_counters.end() && - TaskSpec_actor_counter(pending_task_spec) < task_counter->second) { - /* If the task's counter is less than the highest count for that handle, - * then remove it from the actor's runnable queue. */ - it = entry.task_queue->erase(it); - } else { - it++; - } - } - for (auto it = algorithm_state->waiting_task_queue->begin(); - it != algorithm_state->waiting_task_queue->end();) { - /* Filter out duplicate tasks for the actor that are waiting on a missing - * dependency. */ - TaskSpec *spec = it->Spec(); - if (TaskSpec_actor_id(spec) == actor_id && - TaskSpec_actor_counter(spec) < - entry.task_counters[TaskSpec_actor_handle_id(spec)]) { - /* If the waiting task is for the same actor and its task counter is less - * than the highest count for that handle, then clear its object - * dependencies and remove it from the queue. 
*/ - clear_missing_dependencies(algorithm_state, it); - it = algorithm_state->waiting_task_queue->erase(it); - } else { - it++; - } - } -} - -std::unordered_map get_actor_frontier( - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id) { - RAY_CHECK(algorithm_state->local_actor_infos.count(actor_id) != 0); - return algorithm_state->local_actor_infos[actor_id].frontier_dependencies; -} - -void set_actor_frontier( - LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id, - const std::unordered_map &frontier_dependencies) { - RAY_CHECK(algorithm_state->local_actor_infos.count(actor_id) != 0); - auto entry = algorithm_state->local_actor_infos[actor_id]; - entry.frontier_dependencies = frontier_dependencies; - for (auto frontier_dependency : entry.frontier_dependencies) { - if (algorithm_state->local_objects.count(frontier_dependency.second) == 0) { - handle_object_available(state, algorithm_state, - frontier_dependency.second); - } - } -} diff --git a/src/local_scheduler/local_scheduler_algorithm.h b/src/local_scheduler/local_scheduler_algorithm.h deleted file mode 100644 index 9238d5db58e55..0000000000000 --- a/src/local_scheduler/local_scheduler_algorithm.h +++ /dev/null @@ -1,438 +0,0 @@ -#ifndef LOCAL_SCHEDULER_ALGORITHM_H -#define LOCAL_SCHEDULER_ALGORITHM_H - -#include "local_scheduler_shared.h" -#include "common/task.h" -#include "state/local_scheduler_table.h" - -/* ==== The scheduling algorithm ==== - * - * This file contains declaration for all functions and data structures - * that need to be provided if you want to implement a new algorithms - * for the local scheduler. - * - */ - -/** - * Initialize the scheduler state. - * - * @return State managed by the scheduling algorithm. - */ -SchedulingAlgorithmState *SchedulingAlgorithmState_init(void); - -/** - * Free the scheduler state. - * - * @param algorithm_state State maintained by the scheduling algorithm. - * @return Void. - */ -void SchedulingAlgorithmState_free(SchedulingAlgorithmState *algorithm_state); - -/** - * - */ -void provide_scheduler_info(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerInfo *info); - -/** - * This function will be called when a new task is submitted by a worker for - * execution. The task will either be: - * 1. Put into the waiting queue, where it will wait for its dependencies to - * become available. - * 2. Put into the dispatch queue, where it will wait for an available worker. - * 3. Given to the global scheduler to be scheduled. - * - * Currently, the local scheduler policy is to keep the task if its - * dependencies are ready and there is an available worker. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param task Task that is submitted by the worker. - * @return Void. - */ -void handle_task_submitted(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec); - -/** - * This version of handle_task_submitted is used when the task being submitted - * is a method of an actor. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param task Task that is submitted by the worker. - * @return Void. 
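A small sketch of the per-handle counter filtering performed by set_actor_task_counters above: after restoring counters from a checkpoint, any queued actor task whose counter is below the restored high-water mark for its handle has already executed and is dropped. HandleId and QueuedTask are illustrative stand-ins.

#include <cstdint>
#include <iostream>
#include <list>
#include <string>
#include <unordered_map>

using HandleId = std::string;

struct QueuedTask {
  HandleId handle;
  int64_t counter;  // position of this task in its handle's submission order
};

void DropAlreadyExecuted(
    std::list<QueuedTask> &queue,
    const std::unordered_map<HandleId, int64_t> &counters) {
  for (auto it = queue.begin(); it != queue.end();) {
    auto restored = counters.find(it->handle);
    if (restored != counters.end() && it->counter < restored->second) {
      it = queue.erase(it);  // executed before the checkpoint; do not rerun
    } else {
      ++it;
    }
  }
}

int main() {
  std::list<QueuedTask> queue = {{"h1", 3}, {"h1", 5}, {"h2", 0}};
  DropAlreadyExecuted(queue, {{"h1", 5}});  // counters below 5 for h1 are stale
  std::cout << queue.size() << " tasks remain\n";  // 2 tasks remain
}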
- */ -void handle_actor_task_submitted(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec); - -/** - * This function will be called when the local scheduler receives a notification - * about the creation of a new actor. This can be used by the scheduling - * algorithm to resubmit cached actor tasks. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param actor_id The ID of the actor being created. - * @return Void. - */ -void handle_actor_creation_notification( - LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id); - -/** - * This function will be called when a task is assigned by the global scheduler - * for execution on this local scheduler. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param task Task that is assigned by the global scheduler. - * @return Void. - */ -void handle_task_scheduled(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec); - -/** - * This function will be called when an actor task is assigned by the global - * scheduler or by another local scheduler for execution on this local - * scheduler. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param task Task that is assigned by the global scheduler. - * @return Void. - */ -void handle_actor_task_scheduled(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - TaskExecutionSpec &execution_spec); - -/** - * This function is called if a new object becomes available in the local - * plasma store. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param object_id ID of the object that became available. - * @return Void. - */ -void handle_object_available(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - ObjectID object_id); - -/** - * This function is called if an object is removed from the local plasma store. - * - * @param state The state of the local scheduler. - * @param object_id ID of the object that was removed. - * @return Void. - */ -void handle_object_removed(LocalSchedulerState *state, ObjectID object_id); - -/** - * This function is called when a new worker becomes available. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param worker The worker that is available. - * @return Void. - */ -void handle_worker_available(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker); - -/** - * This function is called when a worker is removed. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param worker The worker that is removed. - * @return Void. - */ -void handle_worker_removed(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker); - -/** - * This version of handle_worker_available is called whenever the worker that is - * available is running an actor. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param worker The worker that is available. 
- * @return Void. - */ -void handle_actor_worker_available(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker); - -/** - * Handle the fact that a new worker is available for running an actor. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param actor_id The ID of the actor running on the worker. - * @param initial_execution_dependency The dummy object ID of the actor - * creation task. - * @param worker The worker that was converted to an actor. - * @return Void. - */ -void handle_convert_worker_to_actor( - LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - const ActorID &actor_id, - const ObjectID &initial_execution_dependency, - LocalSchedulerClient *worker); - -/** - * Handle the fact that a worker running an actor has disconnected. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param worker The worker that was disconnected. - * @param cleanup Whether the disconnect was during cleanup. - * @return Void. - */ -void handle_actor_worker_disconnect(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker, - bool cleanup); - -/** - * This function is called when a worker that was executing a task becomes - * blocked on an object that isn't available locally yet. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param worker The worker that is blocked. - * @return Void. - */ -void handle_worker_blocked(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker); - -/** - * This function is called when an actor that was executing a task becomes - * blocked on an object that isn't available locally yet. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param worker The worker that is blocked. - * @return Void. - */ -void handle_actor_worker_blocked(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker); - -/** - * This function is called when a worker that was blocked on an object that - * wasn't available locally yet becomes unblocked. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param worker The worker that is now unblocked. - * @return Void. - */ -void handle_worker_unblocked(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker); - -/** - * This function is called when an actor that was blocked on an object that - * wasn't available locally yet becomes unblocked. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. - * @param worker The worker that is now unblocked. - * @return Void. - */ -void handle_actor_worker_unblocked(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - LocalSchedulerClient *worker); - -/** - * Process the fact that a driver has been removed. This will remove all of the - * tasks for that driver from the scheduling algorithm's internal data - * structures. - * - * @param state The state of the local scheduler. - * @param algorithm_state State maintained by the scheduling algorithm. 
- * @param driver_id The ID of the driver that was removed. - * @return Void. - */ -void handle_driver_removed(LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - WorkerID driver_id); - -/** - * This function fetches queued task's missing object dependencies. It is - * called every local_scheduler_fetch_timeout_milliseconds. - * - * @param loop The local scheduler's event loop. - * @param id The ID of the timer that triggers this function. - * @param context The function's context. - * @return An integer representing the time interval in seconds before the - * next invocation of the function. - */ -int fetch_object_timeout_handler(event_loop *loop, timer_id id, void *context); - -/** - * This function initiates reconstruction for task's missing object - * dependencies. It is called every - * local_scheduler_reconstruction_timeout_milliseconds, but it may not initiate - * reconstruction for every missing object. - * - * @param loop The local scheduler's event loop. - * @param id The ID of the timer that triggers this function. - * @param context The function's context. - * @return An integer representing the time interval in seconds before the - * next invocation of the function. - */ -int reconstruct_object_timeout_handler(event_loop *loop, - timer_id id, - void *context); - -/// This function initiates reconstruction for the actor creation tasks -/// corresponding to the actor tasks cached in the local scheduler. -/// -/// \param loop The local scheduler's event loop. -/// \param id The ID of the timer that triggers this function. -/// \param context The function's context. -/// \return An integer representing the time interval in seconds before the -/// next invocation of the function. -int rerun_actor_creation_tasks_timeout_handler(event_loop *loop, - timer_id id, - void *context); - -/** - * Check whether an object, including actor dummy objects, is locally - * available. - * - * @param algorithm_state State maintained by the scheduling algorithm. - * @param object_id The ID of the object to check for. - * @return A bool representing whether the object is locally available. - */ -bool object_locally_available(SchedulingAlgorithmState *algorithm_state, - ObjectID object_id); - -/// Spill some tasks back to the global scheduler. This function implements the -/// spillback policy. -/// -/// @param state The scheduler state. -/// @return Void. -void spillback_tasks_handler(LocalSchedulerState *state); - -/** - * A helper function to print debug information about the current state and - * number of workers. - * - * @param message A message to identify the log message. - * @param algorithm_state State maintained by the scheduling algorithm. - * @return Void. - */ -void print_worker_info(const char *message, - SchedulingAlgorithmState *algorithm_state); - -/* - * The actor frontier consists of the number of tasks executed so far and the - * execution dependencies required by the current runnable tasks, according to - * the actor's local scheduler. Since an actor may have multiple handles, the - * tasks submitted to the actor form a DAG, where nodes are tasks and edges are - * execution dependencies. The frontier is a cut across this DAG. The number of - * tasks so far is the number of nodes included in the DAG root's partition. - * - * The actor gets the current frontier of tasks from the local scheduler during - * a checkpoint save, so that it can save the point in the actor's lifetime at - * which the checkpoint was taken. 
If the actor later resumes from that - * checkpoint, the actor can set the current frontier of tasks in the local - * scheduler so that the same frontier of tasks can be made runnable again - * during reconstruction, and so that we do not duplicate execution of tasks - * that already executed before the checkpoint. - */ - -/** - * Get the number of tasks, per actor handle, that have been executed on an - * actor so far. - * - * @param algorithm_state State maintained by the scheduling algorithm. - * @param actor_id The ID of the actor whose task counters are returned. - * @return A map from handle ID to the number of tasks submitted by that handle - * that have executed so far. - */ -std::unordered_map get_actor_task_counters( - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id); - -/** - * Set the number of tasks, per actor handle, that have been executed on an - * actor so far. All previous counts will be overwritten. Tasks that are - * waiting or runnable on the local scheduler that have a lower task count will - * be discarded, so that we don't duplicate execution. - * - * @param algorithm_state State maintained by the scheduling algorithm. - * @param actor_id The ID of the actor whose task counters are returned. - * @param task_counters A map from handle ID to the number of tasks submitted - * by that handle that have executed so far. - * @return Void. - */ -void set_actor_task_counters( - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id, - const std::unordered_map &task_counters); - -/** - * Get the actor's frontier of task dependencies. - * NOTE(swang): The returned frontier only includes handles known by the local - * scheduler. It does not include handles for which the local scheduler has not - * seen a runnable task yet. - * - * @param algorithm_state State maintained by the scheduling algorithm. - * @param actor_id The ID of the actor whose task counters are returned. - * @return A map from handle ID to execution dependency for the earliest - * runnable task submitted through that handle. - */ -std::unordered_map get_actor_frontier( - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id); - -/** - * Set the actor's frontier of task dependencies. The previous frontier will be - * overwritten. Any tasks that have an execution dependency on the new frontier - * (and that have all other dependencies fulfilled) will become runnable. - * - * @param algorithm_state State maintained by the scheduling algorithm. - * @param actor_id The ID of the actor whose task counters are returned. - * @param frontier_dependencies A map from handle ID to execution dependency - * for the earliest runnable task submitted through that handle. - * @return Void. - */ -void set_actor_frontier( - LocalSchedulerState *state, - SchedulingAlgorithmState *algorithm_state, - ActorID actor_id, - const std::unordered_map &frontier_dependencies); - -/** The following methods are for testing purposes only. */ -#ifdef LOCAL_SCHEDULER_TEST -/** - * Get the number of tasks currently waiting for object dependencies to become - * available locally. - * - * @param algorithm_state State maintained by the scheduling algorithm. - * @return The number of tasks queued. - */ -int num_waiting_tasks(SchedulingAlgorithmState *algorithm_state); - -/** - * Get the number of tasks currently waiting for a worker to become available. - * - * @param algorithm_state State maintained by the scheduling algorithm. - * @return The number of tasks queued. 
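To make the checkpoint flow described above concrete, a save/restore sketch over the frontier API follows. The ActorHandleID key type, the int64_t/ObjectID value types, and the ActorCheckpoint container are assumptions inferred from the doc comments, not declarations copied from this header.

// Sketch of a checkpoint save/restore path built on the frontier API above.
#include <cstdint>
#include <unordered_map>
#include "local_scheduler_algorithm.h"
#include "local_scheduler_shared.h"

struct ActorCheckpoint {
  // Assumed types: handle ID -> executed-task count, handle ID -> dependency.
  std::unordered_map<ActorHandleID, int64_t> task_counters;
  std::unordered_map<ActorHandleID, ObjectID> frontier;
};

ActorCheckpoint save_actor_checkpoint(SchedulingAlgorithmState *algorithm_state,
                                      ActorID actor_id) {
  ActorCheckpoint checkpoint;
  // How many tasks each handle has executed so far...
  checkpoint.task_counters = get_actor_task_counters(algorithm_state, actor_id);
  // ...and the execution dependency of the earliest runnable task per handle.
  checkpoint.frontier = get_actor_frontier(algorithm_state, actor_id);
  return checkpoint;
}

void restore_actor_checkpoint(LocalSchedulerState *state,
                              SchedulingAlgorithmState *algorithm_state,
                              ActorID actor_id,
                              const ActorCheckpoint &checkpoint) {
  // Overwrite the counters first so queued tasks from before the checkpoint
  // are discarded, then set the frontier so the tasks that depend on it
  // become runnable again during reconstruction.
  set_actor_task_counters(algorithm_state, actor_id, checkpoint.task_counters);
  set_actor_frontier(state, algorithm_state, actor_id, checkpoint.frontier);
}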
- */ -int num_dispatch_tasks(SchedulingAlgorithmState *algorithm_state); -#endif - -#endif /* LOCAL_SCHEDULER_ALGORITHM_H */ diff --git a/src/local_scheduler/local_scheduler_client.cc b/src/local_scheduler/local_scheduler_client.cc deleted file mode 100644 index 91b5fa9c9df1a..0000000000000 --- a/src/local_scheduler/local_scheduler_client.cc +++ /dev/null @@ -1,378 +0,0 @@ -#include "local_scheduler_client.h" - -#include "common_protocol.h" -#include "format/local_scheduler_generated.h" -#include "ray/raylet/format/node_manager_generated.h" - -#include "common/io.h" -#include "common/task.h" -#include -#include -#include - -using MessageType = ray::local_scheduler::protocol::MessageType; - -LocalSchedulerConnection *LocalSchedulerConnection_init( - const char *local_scheduler_socket, - const UniqueID &client_id, - bool is_worker, - const JobID &driver_id, - bool use_raylet, - const Language &language) { - LocalSchedulerConnection *result = new LocalSchedulerConnection(); - result->use_raylet = use_raylet; - result->conn = connect_ipc_sock_retry(local_scheduler_socket, -1, -1); - - /* Register with the local scheduler. - * NOTE(swang): If the local scheduler exits and we are registered as a - * worker, we will get killed. */ - flatbuffers::FlatBufferBuilder fbb; - if (use_raylet) { - auto message = ray::protocol::CreateRegisterClientRequest( - fbb, is_worker, to_flatbuf(fbb, client_id), getpid(), - to_flatbuf(fbb, driver_id), language); - fbb.Finish(message); - } else { - auto message = ray::local_scheduler::protocol::CreateRegisterClientRequest( - fbb, is_worker, to_flatbuf(fbb, client_id), getpid(), - to_flatbuf(fbb, driver_id)); - fbb.Finish(message); - } - /* Register the process ID with the local scheduler. */ - int success = write_message( - result->conn, static_cast(MessageType::RegisterClientRequest), - fbb.GetSize(), fbb.GetBufferPointer(), &result->write_mutex); - RAY_CHECK(success == 0) << "Unable to register worker with local scheduler"; - - return result; -} - -void LocalSchedulerConnection_free(LocalSchedulerConnection *conn) { - close(conn->conn); - delete conn; -} - -void local_scheduler_disconnect_client(LocalSchedulerConnection *conn) { - flatbuffers::FlatBufferBuilder fbb; - auto message = ray::local_scheduler::protocol::CreateDisconnectClient(fbb); - fbb.Finish(message); - write_message(conn->conn, static_cast(MessageType::DisconnectClient), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); -} - -void local_scheduler_log_event(LocalSchedulerConnection *conn, - uint8_t *key, - int64_t key_length, - uint8_t *value, - int64_t value_length, - double timestamp) { - flatbuffers::FlatBufferBuilder fbb; - auto key_string = fbb.CreateString((char *) key, key_length); - auto value_string = fbb.CreateString((char *) value, value_length); - auto message = ray::local_scheduler::protocol::CreateEventLogMessage( - fbb, key_string, value_string, timestamp); - fbb.Finish(message); - write_message(conn->conn, static_cast(MessageType::EventLogMessage), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); -} - -void local_scheduler_submit(LocalSchedulerConnection *conn, - const TaskExecutionSpec &execution_spec) { - flatbuffers::FlatBufferBuilder fbb; - auto execution_dependencies = - to_flatbuf(fbb, execution_spec.ExecutionDependencies()); - auto task_spec = - fbb.CreateString(reinterpret_cast(execution_spec.Spec()), - execution_spec.SpecSize()); - auto message = ray::local_scheduler::protocol::CreateSubmitTaskRequest( - fbb, execution_dependencies, task_spec); - 
fbb.Finish(message); - write_message(conn->conn, static_cast(MessageType::SubmitTask), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); -} - -void local_scheduler_submit_raylet( - LocalSchedulerConnection *conn, - const std::vector &execution_dependencies, - const ray::raylet::TaskSpecification &task_spec) { - flatbuffers::FlatBufferBuilder fbb; - auto execution_dependencies_message = to_flatbuf(fbb, execution_dependencies); - auto message = ray::local_scheduler::protocol::CreateSubmitTaskRequest( - fbb, execution_dependencies_message, task_spec.ToFlatbuffer(fbb)); - fbb.Finish(message); - write_message(conn->conn, static_cast(MessageType::SubmitTask), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); -} - -TaskSpec *local_scheduler_get_task(LocalSchedulerConnection *conn, - int64_t *task_size) { - int64_t type; - int64_t reply_size; - uint8_t *reply; - { - std::unique_lock guard(conn->mutex); - write_message(conn->conn, static_cast(MessageType::GetTask), 0, - NULL, &conn->write_mutex); - /* Receive a task from the local scheduler. This will block until the local - * scheduler gives this client a task. */ - read_message(conn->conn, &type, &reply_size, &reply); - } - if (type == static_cast(CommonMessageType::DISCONNECT_CLIENT)) { - RAY_LOG(DEBUG) << "Exiting because local scheduler closed connection."; - exit(1); - } - RAY_CHECK(static_cast(type) == MessageType::ExecuteTask); - - /* Parse the flatbuffer object. */ - auto reply_message = - flatbuffers::GetRoot(reply); - - /* Create a copy of the task spec so we can free the reply. */ - *task_size = reply_message->task_spec()->size(); - TaskSpec *data = (TaskSpec *) reply_message->task_spec()->data(); - TaskSpec *spec = TaskSpec_copy(data, *task_size); - - // Set the GPU IDs for this task. We only do this for non-actor tasks because - // for actors the GPUs are associated with the actor itself and not with the - // actor methods. Note that this also processes GPUs for actor creation tasks. - if (!TaskSpec_is_actor_task(spec)) { - conn->gpu_ids.clear(); - for (size_t i = 0; i < reply_message->gpu_ids()->size(); ++i) { - conn->gpu_ids.push_back(reply_message->gpu_ids()->Get(i)); - } - } - - /* Free the original message from the local scheduler. */ - free(reply); - /* Return the copy of the task spec and pass ownership to the caller. */ - return spec; -} - -// This is temporarily duplicated from local_scheduler_get_task while we have -// the raylet and non-raylet code paths. -TaskSpec *local_scheduler_get_task_raylet(LocalSchedulerConnection *conn, - int64_t *task_size) { - int64_t type; - int64_t reply_size; - uint8_t *reply; - { - std::unique_lock guard(conn->mutex); - write_message(conn->conn, static_cast(MessageType::GetTask), 0, - NULL, &conn->write_mutex); - // Receive a task from the local scheduler. This will block until the local - // scheduler gives this client a task. - read_message(conn->conn, &type, &reply_size, &reply); - } - if (type == static_cast(CommonMessageType::DISCONNECT_CLIENT)) { - RAY_LOG(DEBUG) << "Exiting because local scheduler closed connection."; - exit(1); - } - RAY_CHECK(type == static_cast(MessageType::ExecuteTask)); - - // Parse the flatbuffer object. - auto reply_message = flatbuffers::GetRoot(reply); - - // Create a copy of the task spec so we can free the reply. 
- *task_size = reply_message->task_spec()->size(); - const TaskSpec *data = - reinterpret_cast(reply_message->task_spec()->data()); - TaskSpec *spec = TaskSpec_copy(const_cast(data), *task_size); - - // Set the resource IDs for this task. - conn->resource_ids_.clear(); - for (size_t i = 0; i < reply_message->fractional_resource_ids()->size(); - ++i) { - auto const &fractional_resource_ids = - reply_message->fractional_resource_ids()->Get(i); - auto &acquired_resources = conn->resource_ids_[string_from_flatbuf( - *fractional_resource_ids->resource_name())]; - - size_t num_resource_ids = fractional_resource_ids->resource_ids()->size(); - size_t num_resource_fractions = - fractional_resource_ids->resource_fractions()->size(); - RAY_CHECK(num_resource_ids == num_resource_fractions); - RAY_CHECK(num_resource_ids > 0); - for (size_t j = 0; j < num_resource_ids; ++j) { - int64_t resource_id = fractional_resource_ids->resource_ids()->Get(j); - double resource_fraction = - fractional_resource_ids->resource_fractions()->Get(j); - if (num_resource_ids > 1) { - int64_t whole_fraction = resource_fraction; - RAY_CHECK(whole_fraction == resource_fraction); - } - acquired_resources.push_back( - std::make_pair(resource_id, resource_fraction)); - } - } - - // Free the original message from the local scheduler. - free(reply); - // Return the copy of the task spec and pass ownership to the caller. - return spec; -} - -void local_scheduler_task_done(LocalSchedulerConnection *conn) { - write_message(conn->conn, static_cast(MessageType::TaskDone), 0, - NULL, &conn->write_mutex); -} - -void local_scheduler_reconstruct_objects( - LocalSchedulerConnection *conn, - const std::vector &object_ids, - bool fetch_only) { - flatbuffers::FlatBufferBuilder fbb; - auto object_ids_message = to_flatbuf(fbb, object_ids); - auto message = ray::local_scheduler::protocol::CreateReconstructObjects( - fbb, object_ids_message, fetch_only); - fbb.Finish(message); - write_message(conn->conn, - static_cast(MessageType::ReconstructObjects), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); - /* TODO(swang): Propagate the error. 
*/ -} - -void local_scheduler_log_message(LocalSchedulerConnection *conn) { - write_message(conn->conn, static_cast(MessageType::EventLogMessage), - 0, NULL, &conn->write_mutex); -} - -void local_scheduler_notify_unblocked(LocalSchedulerConnection *conn) { - write_message(conn->conn, static_cast(MessageType::NotifyUnblocked), - 0, NULL, &conn->write_mutex); -} - -void local_scheduler_put_object(LocalSchedulerConnection *conn, - TaskID task_id, - ObjectID object_id) { - flatbuffers::FlatBufferBuilder fbb; - auto message = ray::local_scheduler::protocol::CreatePutObject( - fbb, to_flatbuf(fbb, task_id), to_flatbuf(fbb, object_id)); - fbb.Finish(message); - - write_message(conn->conn, static_cast(MessageType::PutObject), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); -} - -const std::vector local_scheduler_get_actor_frontier( - LocalSchedulerConnection *conn, - ActorID actor_id) { - flatbuffers::FlatBufferBuilder fbb; - auto message = ray::local_scheduler::protocol::CreateGetActorFrontierRequest( - fbb, to_flatbuf(fbb, actor_id)); - fbb.Finish(message); - int64_t type; - std::vector reply; - { - std::unique_lock guard(conn->mutex); - write_message(conn->conn, - static_cast(MessageType::GetActorFrontierRequest), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); - - read_vector(conn->conn, &type, reply); - } - if (static_cast(type) == - CommonMessageType::DISCONNECT_CLIENT) { - RAY_LOG(DEBUG) << "Exiting because local scheduler closed connection."; - exit(1); - } - RAY_CHECK(static_cast(type) == - MessageType::GetActorFrontierReply); - return reply; -} - -void local_scheduler_set_actor_frontier(LocalSchedulerConnection *conn, - const std::vector &frontier) { - write_message(conn->conn, static_cast(MessageType::SetActorFrontier), - frontier.size(), const_cast(frontier.data()), - &conn->write_mutex); -} - -std::pair, std::vector> local_scheduler_wait( - LocalSchedulerConnection *conn, - const std::vector &object_ids, - int num_returns, - int64_t timeout_milliseconds, - bool wait_local) { - // Write request. - flatbuffers::FlatBufferBuilder fbb; - auto message = ray::protocol::CreateWaitRequest( - fbb, to_flatbuf(fbb, object_ids), num_returns, timeout_milliseconds, - wait_local); - fbb.Finish(message); - int64_t type; - int64_t reply_size; - uint8_t *reply; - { - std::unique_lock guard(conn->mutex); - write_message(conn->conn, - static_cast(ray::protocol::MessageType::WaitRequest), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); - // Read result. - read_message(conn->conn, &type, &reply_size, &reply); - } - RAY_CHECK(static_cast(type) == - ray::protocol::MessageType::WaitReply); - auto reply_message = flatbuffers::GetRoot(reply); - // Convert result. - std::pair, std::vector> result; - auto found = reply_message->found(); - for (uint i = 0; i < found->size(); i++) { - ObjectID object_id = ObjectID::from_binary(found->Get(i)->str()); - result.first.push_back(object_id); - } - auto remaining = reply_message->remaining(); - for (uint i = 0; i < remaining->size(); i++) { - ObjectID object_id = ObjectID::from_binary(remaining->Get(i)->str()); - result.second.push_back(object_id); - } - /* Free the original message from the local scheduler. 
*/ - free(reply); - return result; -} - -void local_scheduler_push_error(LocalSchedulerConnection *conn, - const JobID &job_id, - const std::string &type, - const std::string &error_message, - double timestamp) { - flatbuffers::FlatBufferBuilder fbb; - auto message = ray::protocol::CreatePushErrorRequest( - fbb, to_flatbuf(fbb, job_id), fbb.CreateString(type), - fbb.CreateString(error_message), timestamp); - fbb.Finish(message); - - write_message(conn->conn, static_cast( - ray::protocol::MessageType::PushErrorRequest), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); -} - -void local_scheduler_push_profile_events( - LocalSchedulerConnection *conn, - const ProfileTableDataT &profile_events) { - flatbuffers::FlatBufferBuilder fbb; - - auto message = CreateProfileTableData(fbb, &profile_events); - fbb.Finish(message); - - write_message(conn->conn, - static_cast( - ray::protocol::MessageType::PushProfileEventsRequest), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); -} - -void local_scheduler_free_objects_in_object_store( - LocalSchedulerConnection *conn, - const std::vector &object_ids, - bool local_only) { - flatbuffers::FlatBufferBuilder fbb; - auto message = ray::protocol::CreateFreeObjectsRequest( - fbb, local_only, to_flatbuf(fbb, object_ids)); - fbb.Finish(message); - - int success = write_message( - conn->conn, - static_cast( - ray::protocol::MessageType::FreeObjectsInObjectStoreRequest), - fbb.GetSize(), fbb.GetBufferPointer(), &conn->write_mutex); - RAY_CHECK(success == 0) << "Failed to write message to raylet."; -} diff --git a/src/local_scheduler/local_scheduler_client.h b/src/local_scheduler/local_scheduler_client.h deleted file mode 100644 index bb4fdb345896c..0000000000000 --- a/src/local_scheduler/local_scheduler_client.h +++ /dev/null @@ -1,260 +0,0 @@ -#ifndef LOCAL_SCHEDULER_CLIENT_H -#define LOCAL_SCHEDULER_CLIENT_H - -#include - -#include "common/task.h" -#include "local_scheduler_shared.h" -#include "ray/raylet/task_spec.h" - -struct LocalSchedulerConnection { - /// True if we should use the raylet code path and false otherwise. - bool use_raylet; - /** File descriptor of the Unix domain socket that connects to local - * scheduler. */ - int conn; - /** The IDs of the GPUs that this client can use. NOTE(rkn): This is only used - * by legacy Ray and will be deprecated. */ - std::vector gpu_ids; - /// A map from resource name to the resource IDs that are currently reserved - /// for this worker. Each pair consists of the resource ID and the fraction - /// of that resource allocated for this worker. - std::unordered_map>> - resource_ids_; - /// A mutex to protect stateful operations of the local scheduler client. - std::mutex mutex; - /// A mutext to protect write operations of the local scheduler client. - std::mutex write_mutex; -}; - -/** - * Connect to the local scheduler. - * - * @param local_scheduler_socket The name of the socket to use to connect to the - * local scheduler. - * @param worker_id A unique ID to represent the worker. - * @param is_worker Whether this client is a worker. If it is a worker, an - * additional message will be sent to register as one. - * @param driver_id The ID of the driver. This is non-nil if the client is a - * driver. - * @param use_raylet True if we should use the raylet code path and false - * otherwise. - * @return The connection information. 
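The resource_ids_ field documented in the struct above is what local_scheduler_get_task_raylet (in the deleted .cc earlier in this diff) fills in when a task is assigned: for each resource name, the list of (resource ID, fraction) pairs reserved for this worker. A small helper sketch, assuming the map is keyed by plain resource-name strings such as "GPU" and holds std::pair<int64_t, double> entries as the comments describe:

// Sketch: recover the GPU IDs granted to this worker after a task is
// assigned on the raylet path. The "GPU" key is an assumption.
#include <cstdint>
#include <utility>
#include <vector>
#include "local_scheduler_client.h"

std::vector<int64_t> granted_gpu_ids(const LocalSchedulerConnection &conn) {
  std::vector<int64_t> gpu_ids;
  auto it = conn.resource_ids_.find("GPU");
  if (it == conn.resource_ids_.end()) {
    return gpu_ids;  // No GPUs were reserved for this worker.
  }
  for (const auto &id_and_fraction : it->second) {
    // Each entry pairs a resource ID with the fraction of that resource
    // reserved for this worker (1.0 means a whole GPU).
    gpu_ids.push_back(id_and_fraction.first);
  }
  return gpu_ids;
}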
- */ -LocalSchedulerConnection *LocalSchedulerConnection_init( - const char *local_scheduler_socket, - const UniqueID &worker_id, - bool is_worker, - const JobID &driver_id, - bool use_raylet, - const Language &language); - -/** - * Disconnect from the local scheduler. - * - * @param conn Local scheduler connection information returned by - * LocalSchedulerConnection_init. - * @return Void. - */ -void LocalSchedulerConnection_free(LocalSchedulerConnection *conn); - -/** - * Submit a task to the local scheduler. - * - * @param conn The connection information. - * @param execution_spec The execution spec for the task to submit. - * @return Void. - */ -void local_scheduler_submit(LocalSchedulerConnection *conn, - const TaskExecutionSpec &execution_spec); - -/// Submit a task using the raylet code path. -/// -/// \param The connection information. -/// \param The execution dependencies. -/// \param The task specification. -/// \return Void. -void local_scheduler_submit_raylet( - LocalSchedulerConnection *conn, - const std::vector &execution_dependencies, - const ray::raylet::TaskSpecification &task_spec); - -/** - * Notify the local scheduler that this client is disconnecting gracefully. This - * is used by actors to exit gracefully so that the local scheduler doesn't - * propagate an error message to the driver. - * - * @param conn The connection information. - * @return Void. - */ -void local_scheduler_disconnect_client(LocalSchedulerConnection *conn); - -/** - * Log an event to the event log. This will call RPUSH key value. We use RPUSH - * instead of SET so that it is possible to flush the log multiple times with - * the same key (for example the key might be shared across logging calls in the - * same task on a worker). - * - * @param conn The connection information. - * @param key The key to store the event in. - * @param key_length The length of the key. - * @param value The value to store. - * @param value_length The length of the value. - * @param timestamp The time that the event is logged. - * @return Void. - */ -void local_scheduler_log_event(LocalSchedulerConnection *conn, - uint8_t *key, - int64_t key_length, - uint8_t *value, - int64_t value_length, - double timestamp); - -/** - * Get next task for this client. This will block until the scheduler assigns - * a task to this worker. This allocates and returns a task, and so the task - * must be freed by the caller. - * - * @todo When does this actually get freed? - * - * @param conn The connection information. - * @param task_size A pointer to fill out with the task size. - * @return The address of the assigned task. - */ -TaskSpec *local_scheduler_get_task(LocalSchedulerConnection *conn, - int64_t *task_size); - -/// Get next task for this client. This will block until the scheduler assigns -/// a task to this worker. This allocates and returns a task, and so the task -/// must be freed by the caller. -/// -/// \param conn The connection information. -/// \param task_size A pointer to fill out with the task size. -/// \return The address of the assigned task. -TaskSpec *local_scheduler_get_task_raylet(LocalSchedulerConnection *conn, - int64_t *task_size); - -/** - * Tell the local scheduler that the client has finished executing a task. - * - * @param conn The connection information. - * @return Void. - */ -void local_scheduler_task_done(LocalSchedulerConnection *conn); - -/** - * Tell the local scheduler to reconstruct or fetch objects. - * - * @param conn The connection information. 
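Taken together, the declarations above define the worker side of the protocol. A rough lifecycle sketch for a worker on the legacy (non-raylet) path, mirroring how the tests later in this diff drive the API, might look like this; the socket path and the execution step are placeholders.

// Sketch of a worker's lifecycle against the client API above.
#include <cstdint>
#include <cstdlib>
#include "local_scheduler_client.h"

void run_one_task(const char *socket_name) {
  // Register as a worker; argument values mirror the tests below.
  LocalSchedulerConnection *conn = LocalSchedulerConnection_init(
      socket_name, WorkerID::nil(), /*is_worker=*/true, JobID::nil(),
      /*use_raylet=*/false, Language::PYTHON);

  // Block until the scheduler assigns a task; the returned spec is a copy
  // owned by the caller.
  int64_t task_size = 0;
  TaskSpec *spec = local_scheduler_get_task(conn, &task_size);

  // ... execute the task ...

  // Report completion, release the copied spec, then disconnect gracefully
  // so no error is propagated to the driver.
  local_scheduler_task_done(conn);
  free(spec);
  local_scheduler_disconnect_client(conn);
  LocalSchedulerConnection_free(conn);
}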
- * @param object_ids The IDs of the objects to reconstruct. - * @param fetch_only Only fetch objects, do not reconstruct them. - * @return Void. - */ -void local_scheduler_reconstruct_objects( - LocalSchedulerConnection *conn, - const std::vector &object_ids, - bool fetch_only = false); - -/** - * Send a log message to the local scheduler. - * - * @param conn The connection information. - * @return Void. - */ -void local_scheduler_log_message(LocalSchedulerConnection *conn); - -/** - * Notify the local scheduler that this client (worker) is no longer blocked. - * - * @param conn The connection information. - * @return Void. - */ -void local_scheduler_notify_unblocked(LocalSchedulerConnection *conn); - -/** - * Record the mapping from object ID to task ID for put events. - * - * @param conn The connection information. - * @param task_id The ID of the task that called put. - * @param object_id The ID of the object being stored. - * @return Void. - */ -void local_scheduler_put_object(LocalSchedulerConnection *conn, - TaskID task_id, - ObjectID object_id); - -/** - * Get an actor's current task frontier. - * - * @param conn The connection information. - * @param actor_id The ID of the actor whose frontier is returned. - * @return A byte vector that can be traversed as an ActorFrontier flatbuffer. - */ -const std::vector local_scheduler_get_actor_frontier( - LocalSchedulerConnection *conn, - ActorID actor_id); - -/** - * Set an actor's current task frontier. - * - * @param conn The connection information. - * @param frontier An ActorFrontier flatbuffer to set the frontier to. - * @return Void. - */ -void local_scheduler_set_actor_frontier(LocalSchedulerConnection *conn, - const std::vector &frontier); - -/// Wait for the given objects until timeout expires or num_return objects are -/// found. -/// -/// \param conn The connection information. -/// \param object_ids The objects to wait for. -/// \param num_returns The number of objects to wait for. -/// \param timeout_milliseconds Duration, in milliseconds, to wait before -/// returning. -/// \param wait_local Whether to wait for objects to appear on this node. -/// \return A pair with the first element containing the object ids that were -/// found, and the second element the objects that were not found. -std::pair, std::vector> local_scheduler_wait( - LocalSchedulerConnection *conn, - const std::vector &object_ids, - int num_returns, - int64_t timeout_milliseconds, - bool wait_local); - -/// Push an error to the relevant driver. -/// -/// \param conn The connection information. -/// \param The ID of the job that the error is for. -/// \param The type of the error. -/// \param The error message. -/// \param The timestamp of the error. -/// \return Void. -void local_scheduler_push_error(LocalSchedulerConnection *conn, - const JobID &job_id, - const std::string &type, - const std::string &error_message, - double timestamp); - -/// Store some profile events in the GCS. -/// -/// \param conn The connection information. -/// \param profile_events A batch of profiling event information. -/// \return Void. -void local_scheduler_push_profile_events( - LocalSchedulerConnection *conn, - const ProfileTableDataT &profile_events); - -/// Free a list of objects from object stores. -/// -/// \param conn The connection information. -/// \param object_ids A list of ObjectsIDs to be deleted. -/// \param local_only Whether keep this request with local object store -/// or send it to all the object stores. -/// \return Void. 
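The wait declaration above pairs naturally with the reconstruct/fetch call: wait for what is already local, then ask the scheduler to fetch whatever is still missing. A usage sketch follows, with the ObjectID element type of the vectors inferred from the doc comments and the timeout chosen only for illustration.

// Sketch: wait for a set of objects, then fetch (without reconstructing)
// whatever did not appear in time.
#include <utility>
#include <vector>
#include "local_scheduler_client.h"

void wait_then_fetch_missing(LocalSchedulerConnection *conn,
                             const std::vector<ObjectID> &ids) {
  // Block for up to one second or until every object is available locally.
  auto result = local_scheduler_wait(conn, ids, static_cast<int>(ids.size()),
                                     /*timeout_milliseconds=*/1000,
                                     /*wait_local=*/true);
  const std::vector<ObjectID> &remaining = result.second;
  if (!remaining.empty()) {
    // fetch_only = true: bring the objects over without reconstruction.
    local_scheduler_reconstruct_objects(conn, remaining, /*fetch_only=*/true);
  }
}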
-void local_scheduler_free_objects_in_object_store( - LocalSchedulerConnection *conn, - const std::vector &object_ids, - bool local_only); - -#endif diff --git a/src/local_scheduler/local_scheduler_shared.h b/src/local_scheduler/local_scheduler_shared.h deleted file mode 100644 index 572f14a6fdf73..0000000000000 --- a/src/local_scheduler/local_scheduler_shared.h +++ /dev/null @@ -1,137 +0,0 @@ -#ifndef LOCAL_SCHEDULER_SHARED_H -#define LOCAL_SCHEDULER_SHARED_H - -#include "common/task.h" -#include "common/state/table.h" -#include "common/state/db.h" -#include "plasma/client.h" -#include "ray/gcs/client.h" - -#include -#include -#include -#include - -/** This struct is used to maintain a mapping from actor IDs to the ID of the - * local scheduler that is responsible for the actor. */ -struct ActorMapEntry { - /** The ID of the driver that created the actor. */ - WorkerID driver_id; - /** The ID of the local scheduler that is responsible for the actor. */ - DBClientID local_scheduler_id; -}; - -/** Internal state of the scheduling algorithm. */ -typedef struct SchedulingAlgorithmState SchedulingAlgorithmState; - -struct LocalSchedulerClient; - -/** A struct storing the configuration state of the local scheduler. This should - * consist of values that don't change over the lifetime of the local - * scheduler. */ -typedef struct { - /** The script to use when starting a new worker. */ - const char **start_worker_command; - /** Whether there is a global scheduler. */ - bool global_scheduler_exists; -} local_scheduler_config; - -/** The state of the local scheduler. */ -struct LocalSchedulerState { - /** The configuration for the local scheduler. */ - local_scheduler_config config; - /** The local scheduler event loop. */ - event_loop *loop; - /** List of workers available to this node. This is used to free the worker - * structs when we free the scheduler state and also to access the worker - * structs in the tests. */ - std::list workers; - /** A set of driver IDs corresponding to drivers that have been removed. This - * is used to make sure we don't execute any tasks belong to dead drivers. */ - std::unordered_set removed_drivers; - /** A set of actors IDs corresponding to local actors that have been removed. - * This ensures we can reject any tasks destined for dead actors. */ - std::unordered_set removed_actors; - /** List of the process IDs for child processes (workers) started by the - * local scheduler that have not sent a REGISTER_PID message yet. */ - std::vector child_pids; - /** A hash table mapping actor IDs to the db_client_id of the local scheduler - * that is responsible for the actor. */ - std::unordered_map actor_mapping; - /** The handle to the database. */ - DBHandle *db; - /** The Plasma client. */ - plasma::PlasmaClient *plasma_conn; - /** State for the scheduling algorithm. */ - SchedulingAlgorithmState *algorithm_state; - /** Input buffer, used for reading input in process_message to avoid - * allocation for each call to process_message. */ - std::vector input_buffer; - /** Vector of static attributes associated with the node owned by this local - * scheduler. */ - std::unordered_map static_resources; - /** Vector of dynamic attributes associated with the node owned by this local - * scheduler. */ - std::unordered_map dynamic_resources; - /** The IDs of the available GPUs. There is redundancy here in that - * available_gpus.size() == dynamic_resources[ResourceIndex_GPU] should - * always be true. 
*/ - std::vector available_gpus; - /** The time (in milliseconds since the Unix epoch) when the most recent - * heartbeat was sent. */ - int64_t previous_heartbeat_time; -}; - -/** Contains all information associated with a local scheduler client. */ -struct LocalSchedulerClient { - /** The socket used to communicate with the client. */ - int sock; - /** True if the client has registered and false otherwise. */ - bool registered; - /** True if the client has sent a disconnect message to the local scheduler - * and false otherwise. If this is true, then the local scheduler will not - * propagate an error message to the driver when the client exits. */ - bool disconnected; - /** True if the client is a worker and false if it is a driver. */ - bool is_worker; - /** The worker ID if the client is a worker and the driver ID if the client is - * a driver. */ - WorkerID client_id; - /** A pointer to the task object that is currently running on this client. If - * no task is running on the worker, this will be NULL. This is used to - * update the task table. */ - Task *task_in_progress; - /** An array of resource counts currently in use by the worker. */ - std::unordered_map resources_in_use; - /** A vector of the IDs of the GPUs that the worker is currently using. If the - * worker is an actor, this will be constant throughout the lifetime of the - * actor (and will be equal to the number of GPUs requested by the actor). If - * the worker is not an actor, this will be constant for the duration of a - * task and will have length equal to the number of GPUs requested by the - * task (in particular it will not change if the task blocks). */ - std::vector gpus_in_use; - /** A flag to indicate whether this worker is currently blocking on an - * object(s) that isn't available locally yet. */ - bool is_blocked; - /** The process ID of the client. If this is set to zero, the client has not - * yet registered a process ID. */ - pid_t pid; - /** Whether the client is a child process of the local scheduler. */ - bool is_child; - /** The ID of the actor on this worker. If there is no actor running on this - * worker, this should be NIL_ACTOR_ID. */ - ActorID actor_id; - /** A pointer to the local scheduler state. */ - LocalSchedulerState *local_scheduler_state; -}; - -/** - * Free the local scheduler state. This disconnects all clients and notifies - * the global scheduler of the local scheduler's exit. - * - * @param state The state to free. 
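As a concrete reading of the resource bookkeeping above: dynamic_resources tracks how much of each resource is currently free, and available_gpus must stay in step with its GPU entry. A hypothetical consistency check is sketched below; the string-keyed, double-valued map type and the "GPU" key are assumptions, since the comments above only state the invariant informally.

// Hypothetical check of the invariant described above: the number of free
// GPU IDs should equal the dynamic GPU capacity the scheduler has left.
#include <cassert>
#include <string>
#include "local_scheduler_shared.h"

void check_gpu_bookkeeping(const LocalSchedulerState &state) {
  double free_gpus = 0;
  auto it = state.dynamic_resources.find("GPU");
  if (it != state.dynamic_resources.end()) {
    free_gpus = it->second;
  }
  assert(static_cast<double>(state.available_gpus.size()) == free_gpus);
}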
- * @return Void - */ -void LocalSchedulerState_free(LocalSchedulerState *state); - -#endif /* LOCAL_SCHEDULER_SHARED_H */ diff --git a/src/local_scheduler/test/local_scheduler_tests.cc b/src/local_scheduler/test/local_scheduler_tests.cc deleted file mode 100644 index b155ea9494c84..0000000000000 --- a/src/local_scheduler/test/local_scheduler_tests.cc +++ /dev/null @@ -1,704 +0,0 @@ -#include "greatest.h" - -#include -#include -#include -#include -#include -#include - -#include -#include -#include -#include - -#include "common.h" -#include "test/test_common.h" -#include "test/example_task.h" -#include "event_loop.h" -#include "io.h" -#include "task.h" -#include "state/object_table.h" -#include "state/task_table.h" -#include "state/redis.h" - -#include "local_scheduler_shared.h" -#include "local_scheduler.h" -#include "local_scheduler_algorithm.h" -#include "local_scheduler_client.h" - -SUITE(local_scheduler_tests); - -TaskBuilder *g_task_builder = NULL; - -const char *plasma_store_socket_name = "/tmp/plasma_store_socket_1"; -const char *plasma_manager_socket_name_format = "/tmp/plasma_manager_socket_%d"; -const char *local_scheduler_socket_name_format = - "/tmp/local_scheduler_socket_%d"; - -int64_t timeout_handler(event_loop *loop, int64_t id, void *context) { - event_loop_stop(loop); - return EVENT_LOOP_TIMER_DONE; -} - -typedef struct { - /** A socket to mock the Plasma manager. Clients (such as workers) that - * connect to this file descriptor must be accepted. */ - int plasma_manager_fd; - /** A socket to communicate with the Plasma store. */ - int plasma_store_fd; - /** Local scheduler's socket for IPC requests. */ - int local_scheduler_fd; - /** Local scheduler's local scheduler state. */ - LocalSchedulerState *local_scheduler_state; - /** Local scheduler's event loop. */ - event_loop *loop; - /** Number of local scheduler client connections, or mock workers. */ - int num_local_scheduler_conns; - /** Local scheduler client connections. */ - LocalSchedulerConnection **conns; -} LocalSchedulerMock; - -/** - * Register clients of the local scheduler. This function is started in a - * separate thread so enable a blocking call to register the clients. - */ -static void register_clients(int num_mock_workers, LocalSchedulerMock *mock) { - for (int i = 0; i < num_mock_workers; ++i) { - new_client_connection(mock->loop, mock->local_scheduler_fd, - (void *) mock->local_scheduler_state, 0); - LocalSchedulerClient *worker = mock->local_scheduler_state->workers.back(); - process_message(mock->local_scheduler_state->loop, worker->sock, worker, 0); - } -} - -LocalSchedulerMock *LocalSchedulerMock_init(int num_workers, - int num_mock_workers) { - const char *node_ip_address = "127.0.0.1"; - const char *redis_addr = node_ip_address; - int redis_port = 6379; - std::unordered_map static_resource_conf; - static_resource_conf["CPU"] = INT16_MAX; - static_resource_conf["GPU"] = 0; - LocalSchedulerMock *mock = - (LocalSchedulerMock *) malloc(sizeof(LocalSchedulerMock)); - memset(mock, 0, sizeof(LocalSchedulerMock)); - mock->loop = event_loop_create(); - /* Bind to the local scheduler port and initialize the local scheduler. 
*/ - std::string plasma_manager_socket_name = bind_ipc_sock_retry( - plasma_manager_socket_name_format, &mock->plasma_manager_fd); - mock->plasma_store_fd = - connect_ipc_sock_retry(plasma_store_socket_name, 5, 100); - std::string local_scheduler_socket_name = bind_ipc_sock_retry( - local_scheduler_socket_name_format, &mock->local_scheduler_fd); - RAY_CHECK(mock->plasma_store_fd >= 0 && mock->local_scheduler_fd >= 0); - - /* Construct worker command */ - std::stringstream worker_command_ss; - worker_command_ss << "python ../python/ray/workers/default_worker.py" - << " --node-ip-address=" << node_ip_address - << " --object-store-name=" << plasma_store_socket_name - << " --object-store-manager-name=" - << plasma_manager_socket_name - << " --local-scheduler-name=" << local_scheduler_socket_name - << " --redis-address=" << redis_addr << ":" << redis_port; - std::string worker_command = worker_command_ss.str(); - - mock->local_scheduler_state = LocalSchedulerState_init( - "127.0.0.1", mock->loop, redis_addr, redis_port, - local_scheduler_socket_name.c_str(), plasma_store_socket_name, - plasma_manager_socket_name.c_str(), NULL, false, static_resource_conf, - worker_command.c_str(), num_workers); - - /* Accept the workers as clients to the plasma manager. */ - for (int i = 0; i < num_workers; ++i) { - accept_client(mock->plasma_manager_fd); - } - - /* Connect a local scheduler client. */ - mock->num_local_scheduler_conns = num_mock_workers; - mock->conns = (LocalSchedulerConnection **) malloc( - sizeof(LocalSchedulerConnection *) * num_mock_workers); - - std::thread background_thread = - std::thread(register_clients, num_mock_workers, mock); - - for (int i = 0; i < num_mock_workers; ++i) { - mock->conns[i] = LocalSchedulerConnection_init( - local_scheduler_socket_name.c_str(), WorkerID::nil(), true, - JobID::nil(), false, Language::PYTHON); - } - - background_thread.join(); - - return mock; -} - -void LocalSchedulerMock_free(LocalSchedulerMock *mock) { - /* Disconnect clients. */ - for (int i = 0; i < mock->num_local_scheduler_conns; ++i) { - LocalSchedulerConnection_free(mock->conns[i]); - } - free(mock->conns); - - /* Kill all the workers and run the event loop again so that the task table - * updates propagate and the tasks in progress are freed. */ - while (mock->local_scheduler_state->workers.size() > 0) { - LocalSchedulerClient *worker = mock->local_scheduler_state->workers.front(); - kill_worker(mock->local_scheduler_state, worker, true, false); - } - event_loop_add_timer(mock->loop, 500, - (event_loop_timer_handler) timeout_handler, NULL); - event_loop_run(mock->loop); - - /* This also frees mock->loop. */ - LocalSchedulerState_free(mock->local_scheduler_state); - close(mock->plasma_store_fd); - close(mock->plasma_manager_fd); - free(mock); -} - -void reset_worker(LocalSchedulerMock *mock, LocalSchedulerClient *worker) { - if (worker->task_in_progress) { - Task_free(worker->task_in_progress); - worker->task_in_progress = NULL; - } -} - -/** - * Test that object reconstruction gets called. If a task gets submitted, - * assigned to a worker, and then reconstruction is triggered for its return - * value, the task should get assigned to a worker again. - */ -TEST object_reconstruction_test(void) { - LocalSchedulerMock *local_scheduler = LocalSchedulerMock_init(0, 1); - LocalSchedulerConnection *worker = local_scheduler->conns[0]; - - /* Create a task with zero dependencies and one return value. 
*/ - TaskExecutionSpec execution_spec = example_task_execution_spec(0, 1); - TaskSpec *spec = execution_spec.Spec(); - int64_t task_size = execution_spec.SpecSize(); - ObjectID return_id = TaskSpec_return(spec, 0); - - /* Add an empty object table entry for the object we want to reconstruct, to - * simulate it having been created and evicted. */ - const char *client_id = "clientid"; - /* Lookup the shard locations for the object table. */ - std::vector db_shards_addresses; - std::vector db_shards_ports; - redisContext *context = redisConnect("127.0.0.1", 6379); - get_redis_shards(context, db_shards_addresses, db_shards_ports); - redisFree(context); - /* There should only be one shard, so we can safely add the empty object - * table entry to the first one. */ - ASSERT(db_shards_addresses.size() == 1); - context = redisConnect(db_shards_addresses[0].c_str(), db_shards_ports[0]); - redisReply *reply = (redisReply *) redisCommand( - context, "RAY.OBJECT_TABLE_ADD %b %ld %b %s", return_id.data(), - sizeof(return_id), 1, NIL_DIGEST, (size_t) DIGEST_SIZE, client_id); - freeReplyObject(reply); - reply = (redisReply *) redisCommand(context, "RAY.OBJECT_TABLE_REMOVE %b %s", - return_id.data(), sizeof(return_id), - client_id); - freeReplyObject(reply); - redisFree(context); - - pid_t pid = fork(); - if (pid == 0) { - /* Make sure we receive the task twice. First from the initial submission, - * and second from the reconstruct request. */ - int64_t task_assigned_size; - local_scheduler_submit(worker, execution_spec); - TaskSpec *task_assigned = - local_scheduler_get_task(worker, &task_assigned_size); - ASSERT_EQ(memcmp(task_assigned, spec, task_size), 0); - ASSERT_EQ(task_assigned_size, task_size); - int64_t reconstruct_task_size; - TaskSpec *reconstruct_task = - local_scheduler_get_task(worker, &reconstruct_task_size); - ASSERT_EQ(memcmp(reconstruct_task, spec, task_size), 0); - ASSERT_EQ(reconstruct_task_size, task_size); - /* Clean up. */ - free(reconstruct_task); - free(task_assigned); - LocalSchedulerMock_free(local_scheduler); - exit(0); - } else { - /* Run the event loop. NOTE: OSX appears to require the parent process to - * listen for events on the open file descriptors. */ - event_loop_add_timer(local_scheduler->loop, 500, - (event_loop_timer_handler) timeout_handler, NULL); - event_loop_run(local_scheduler->loop); - /* Set the task's status to TaskStatus::DONE to prevent the race condition - * that would suppress object reconstruction. */ - Task *task = Task_alloc( - execution_spec, TaskStatus::DONE, - get_db_client_id(local_scheduler->local_scheduler_state->db)); - task_table_add_task(local_scheduler->local_scheduler_state->db, task, NULL, - NULL, NULL); - - /* Trigger reconstruction, and run the event loop again. */ - ObjectID return_id = TaskSpec_return(spec, 0); - local_scheduler_reconstruct_objects(worker, - std::vector({return_id})); - event_loop_add_timer(local_scheduler->loop, 500, - (event_loop_timer_handler) timeout_handler, NULL); - event_loop_run(local_scheduler->loop); - /* Wait for the child process to exit and check that there are no tasks - * left in the local scheduler's task queue. Then, clean up. */ - wait(NULL); - ASSERT_EQ(num_waiting_tasks( - local_scheduler->local_scheduler_state->algorithm_state), - 0); - ASSERT_EQ(num_dispatch_tasks( - local_scheduler->local_scheduler_state->algorithm_state), - 0); - LocalSchedulerMock_free(local_scheduler); - PASS(); - } -} - -/** - * Test that object reconstruction gets recursively called. 
In a chain of - * tasks, if all inputs are lost, then reconstruction of the final object - * should trigger reconstruction of all previous tasks in the lineage. - */ -TEST object_reconstruction_recursive_test(void) { - LocalSchedulerMock *local_scheduler = LocalSchedulerMock_init(0, 1); - LocalSchedulerConnection *worker = local_scheduler->conns[0]; - /* Create a chain of tasks, each one dependent on the one before it. Mark - * each object as available so that tasks will run immediately. */ - const int NUM_TASKS = 10; - std::vector specs; - specs.push_back(example_task_execution_spec(0, 1)); - for (int i = 1; i < NUM_TASKS; ++i) { - ObjectID arg_id = TaskSpec_return(specs[i - 1].Spec(), 0); - specs.push_back(example_task_execution_spec_with_args(1, 1, &arg_id)); - } - /* Lookup the shard locations for the object table. */ - const char *client_id = "clientid"; - std::vector db_shards_addresses; - std::vector db_shards_ports; - redisContext *context = redisConnect("127.0.0.1", 6379); - get_redis_shards(context, db_shards_addresses, db_shards_ports); - redisFree(context); - /* There should only be one shard, so we can safely add the empty object - * table entry to the first one. */ - ASSERT(db_shards_addresses.size() == 1); - context = redisConnect(db_shards_addresses[0].c_str(), db_shards_ports[0]); - for (int i = 0; i < NUM_TASKS; ++i) { - ObjectID return_id = TaskSpec_return(specs[i].Spec(), 0); - redisReply *reply = (redisReply *) redisCommand( - context, "RAY.OBJECT_TABLE_ADD %b %ld %b %s", return_id.data(), - sizeof(return_id), 1, NIL_DIGEST, (size_t) DIGEST_SIZE, client_id); - freeReplyObject(reply); - reply = (redisReply *) redisCommand( - context, "RAY.OBJECT_TABLE_REMOVE %b %s", return_id.data(), - sizeof(return_id), client_id); - freeReplyObject(reply); - } - redisFree(context); - - pid_t pid = fork(); - if (pid == 0) { - /* Submit the tasks, and make sure each one gets assigned to a worker. */ - for (int i = 0; i < NUM_TASKS; ++i) { - local_scheduler_submit(worker, specs[i]); - } - /* Make sure we receive each task from the initial submission. */ - for (int i = 0; i < NUM_TASKS; ++i) { - int64_t task_size; - TaskSpec *task_assigned = local_scheduler_get_task(worker, &task_size); - ASSERT_EQ(memcmp(task_assigned, specs[i].Spec(), specs[i].SpecSize()), 0); - ASSERT_EQ(task_size, specs[i].SpecSize()); - free(task_assigned); - } - /* Check that the workers receive all tasks in the final return object's - * lineage during reconstruction. */ - for (int i = 0; i < NUM_TASKS; ++i) { - int64_t task_assigned_size; - TaskSpec *task_assigned = - local_scheduler_get_task(worker, &task_assigned_size); - for (auto it = specs.begin(); it != specs.end(); it++) { - if (memcmp(task_assigned, it->Spec(), task_assigned_size) == 0) { - specs.erase(it); - break; - } - } - free(task_assigned); - } - ASSERT(specs.size() == 0); - LocalSchedulerMock_free(local_scheduler); - exit(0); - } else { - /* Simulate each task putting its return values in the object store so that - * the next task can run. */ - for (int i = 0; i < NUM_TASKS; ++i) { - ObjectID return_id = TaskSpec_return(specs[i].Spec(), 0); - handle_object_available( - local_scheduler->local_scheduler_state, - local_scheduler->local_scheduler_state->algorithm_state, return_id); - } - /* Run the event loop. All tasks should now be dispatched. NOTE: OSX - * appears to require the parent process to listen for events on the open - * file descriptors. 
*/ - event_loop_add_timer(local_scheduler->loop, 500, - (event_loop_timer_handler) timeout_handler, NULL); - event_loop_run(local_scheduler->loop); - /* Set the final task's status to TaskStatus::DONE to prevent the race - * condition that would suppress object reconstruction. */ - Task *last_task = Task_alloc( - specs[NUM_TASKS - 1], TaskStatus::DONE, - get_db_client_id(local_scheduler->local_scheduler_state->db)); - task_table_add_task(local_scheduler->local_scheduler_state->db, last_task, - NULL, NULL, NULL); - /* Simulate eviction of the objects, so that reconstruction is required. */ - for (int i = 0; i < NUM_TASKS; ++i) { - ObjectID return_id = TaskSpec_return(specs[i].Spec(), 0); - handle_object_removed(local_scheduler->local_scheduler_state, return_id); - } - /* Trigger reconstruction for the last object. */ - ObjectID return_id = TaskSpec_return(specs[NUM_TASKS - 1].Spec(), 0); - local_scheduler_reconstruct_objects(worker, - std::vector({return_id})); - /* Run the event loop again. All tasks should be resubmitted. */ - event_loop_add_timer(local_scheduler->loop, 500, - (event_loop_timer_handler) timeout_handler, NULL); - event_loop_run(local_scheduler->loop); - /* Simulate each task putting its return values in the object store so that - * the next task can run. */ - for (int i = 0; i < NUM_TASKS; ++i) { - ObjectID return_id = TaskSpec_return(specs[i].Spec(), 0); - handle_object_available( - local_scheduler->local_scheduler_state, - local_scheduler->local_scheduler_state->algorithm_state, return_id); - } - /* Run the event loop again. All tasks should be dispatched again. */ - event_loop_add_timer(local_scheduler->loop, 500, - (event_loop_timer_handler) timeout_handler, NULL); - event_loop_run(local_scheduler->loop); - /* Wait for the child process to exit and check that there are no tasks - * left in the local scheduler's task queue. Then, clean up. */ - wait(NULL); - ASSERT_EQ(num_waiting_tasks( - local_scheduler->local_scheduler_state->algorithm_state), - 0); - ASSERT_EQ(num_dispatch_tasks( - local_scheduler->local_scheduler_state->algorithm_state), - 0); - specs.clear(); - LocalSchedulerMock_free(local_scheduler); - PASS(); - } -} - -/** - * Test that object reconstruction gets suppressed when there is a location - * listed for the object in the object table. - */ -TaskExecutionSpec *object_reconstruction_suppression_spec; - -void object_reconstruction_suppression_callback(ObjectID object_id, - bool success, - void *user_context) { - RAY_CHECK(success); - /* Submit the task after adding the object to the object table. */ - LocalSchedulerConnection *worker = (LocalSchedulerConnection *) user_context; - local_scheduler_submit(worker, *object_reconstruction_suppression_spec); -} - -TEST object_reconstruction_suppression_test(void) { - LocalSchedulerMock *local_scheduler = LocalSchedulerMock_init(0, 1); - LocalSchedulerConnection *worker = local_scheduler->conns[0]; - - TaskExecutionSpec execution_spec = example_task_execution_spec(0, 1); - object_reconstruction_suppression_spec = &execution_spec; - ObjectID return_id = - TaskSpec_return(object_reconstruction_suppression_spec->Spec(), 0); - pid_t pid = fork(); - if (pid == 0) { - /* Make sure we receive the task once. This will block until the - * object_table_add callback completes. 
-     */
-    int64_t task_assigned_size;
-    TaskSpec *task_assigned =
-        local_scheduler_get_task(worker, &task_assigned_size);
-    ASSERT_EQ(
-        memcmp(task_assigned, object_reconstruction_suppression_spec->Spec(),
-               object_reconstruction_suppression_spec->SpecSize()),
-        0);
-    /* Trigger a reconstruction. We will check that no tasks get queued as a
-     * result of this line in the event loop process. */
-    local_scheduler_reconstruct_objects(worker,
-                                        std::vector<ObjectID>({return_id}));
-    /* Clean up. */
-    free(task_assigned);
-    LocalSchedulerMock_free(local_scheduler);
-    exit(0);
-  } else {
-    /* Connect a plasma manager client so we can call object_table_add. */
-    std::vector<std::string> db_connect_args;
-    db_connect_args.push_back("manager_address");
-    db_connect_args.push_back("127.0.0.1:12346");
-    DBHandle *db = db_connect(std::string("127.0.0.1"), 6379, "plasma_manager",
-                              "127.0.0.1", db_connect_args);
-    db_attach(db, local_scheduler->loop, false);
-    /* Add the object to the object table. */
-    object_table_add(db, return_id, 1, (unsigned char *) NIL_DIGEST, NULL,
-                     object_reconstruction_suppression_callback,
-                     (void *) worker);
-    /* Run the event loop. NOTE: OSX appears to require the parent process to
-     * listen for events on the open file descriptors. */
-    event_loop_add_timer(local_scheduler->loop, 1000,
-                         (event_loop_timer_handler) timeout_handler, NULL);
-    event_loop_run(local_scheduler->loop);
-    /* Wait for the child process to exit and check that there are no tasks
-     * left in the local scheduler's task queue. Then, clean up. */
-    wait(NULL);
-    ASSERT_EQ(num_waiting_tasks(
-                  local_scheduler->local_scheduler_state->algorithm_state),
-              0);
-    ASSERT_EQ(num_dispatch_tasks(
-                  local_scheduler->local_scheduler_state->algorithm_state),
-              0);
-    db_disconnect(db);
-    LocalSchedulerMock_free(local_scheduler);
-    PASS();
-  }
-}
-
-TEST task_dependency_test(void) {
-  LocalSchedulerMock *local_scheduler = LocalSchedulerMock_init(0, 1);
-  LocalSchedulerState *state = local_scheduler->local_scheduler_state;
-  SchedulingAlgorithmState *algorithm_state = state->algorithm_state;
-  /* Get the first worker. */
-  LocalSchedulerClient *worker = state->workers.front();
-  TaskExecutionSpec execution_spec = example_task_execution_spec(1, 1);
-  TaskSpec *spec = execution_spec.Spec();
-  ObjectID oid = TaskSpec_arg_id(spec, 0, 0);
-
-  /* Check that the task gets queued in the waiting queue if the task is
-   * submitted, but the input and workers are not available. */
-  handle_task_submitted(state, algorithm_state, execution_spec);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Once the input is available, the task gets moved to the dispatch queue. */
-  handle_object_available(state, algorithm_state, oid);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 1);
-  /* Once a worker is available, the task gets assigned. */
-  handle_worker_available(state, algorithm_state, worker);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  reset_worker(local_scheduler, worker);
-
-  /* Check that the task gets queued in the waiting queue if the task is
-   * submitted and a worker is available, but the input is not.
-   */
-  handle_object_removed(state, oid);
-  handle_task_submitted(state, algorithm_state, execution_spec);
-  handle_worker_available(state, algorithm_state, worker);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Once the input is available, the task gets assigned. */
-  handle_object_available(state, algorithm_state, oid);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  reset_worker(local_scheduler, worker);
-
-  /* Check that the task gets queued in the dispatch queue if the task is
-   * submitted and the input is available, but no worker is available yet. */
-  handle_task_submitted(state, algorithm_state, execution_spec);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 1);
-  /* Once a worker is available, the task gets assigned. */
-  handle_worker_available(state, algorithm_state, worker);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  reset_worker(local_scheduler, worker);
-
-  /* If an object gets removed, check the first scenario again, where the task
-   * gets queued in the waiting task if the task is submitted and a worker is
-   * available, but the input is not. */
-  handle_task_submitted(state, algorithm_state, execution_spec);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 1);
-  /* If the input is removed while a task is in the dispatch queue, the task
-   * gets moved back to the waiting queue. */
-  handle_object_removed(state, oid);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Once the input is available, the task gets moved back to the dispatch
-   * queue. */
-  handle_object_available(state, algorithm_state, oid);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 1);
-  /* Once a worker is available, the task gets assigned. */
-  handle_worker_available(state, algorithm_state, worker);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-
-  LocalSchedulerMock_free(local_scheduler);
-  PASS();
-}
-
-TEST task_multi_dependency_test(void) {
-  LocalSchedulerMock *local_scheduler = LocalSchedulerMock_init(0, 1);
-  LocalSchedulerState *state = local_scheduler->local_scheduler_state;
-  SchedulingAlgorithmState *algorithm_state = state->algorithm_state;
-  /* Get the first worker. */
-  LocalSchedulerClient *worker = state->workers.front();
-  TaskExecutionSpec execution_spec = example_task_execution_spec(2, 1);
-  TaskSpec *spec = execution_spec.Spec();
-  ObjectID oid1 = TaskSpec_arg_id(spec, 0, 0);
-  ObjectID oid2 = TaskSpec_arg_id(spec, 1, 0);
-
-  /* Check that the task gets queued in the waiting queue if the task is
-   * submitted, but the inputs and workers are not available. */
-  handle_task_submitted(state, algorithm_state, execution_spec);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Check that the task stays in the waiting queue if only one input becomes
-   * available. */
-  handle_object_available(state, algorithm_state, oid2);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Once all inputs are available, the task is moved to the dispatch queue.
-   */
-  handle_object_available(state, algorithm_state, oid1);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 1);
-  /* Once a worker is available, the task gets assigned. */
-  handle_worker_available(state, algorithm_state, worker);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  reset_worker(local_scheduler, worker);
-
-  /* Check that the task gets queued in the dispatch queue if the task is
-   * submitted and the inputs are available, but no worker is available yet. */
-  handle_task_submitted(state, algorithm_state, execution_spec);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 1);
-  /* If any input is removed while a task is in the dispatch queue, the task
-   * gets moved back to the waiting queue. */
-  handle_object_removed(state, oid1);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  handle_object_removed(state, oid2);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Check that the task stays in the waiting queue if only one input becomes
-   * available. */
-  handle_object_available(state, algorithm_state, oid2);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Check that the task stays in the waiting queue if the one input is
-   * unavailable again. */
-  handle_object_removed(state, oid2);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Check that the task stays in the waiting queue if the other input becomes
-   * available. */
-  handle_object_available(state, algorithm_state, oid1);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 1);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  /* Once all inputs are available, the task is moved to the dispatch queue. */
-  handle_object_available(state, algorithm_state, oid2);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 1);
-  /* Once a worker is available, the task gets assigned. */
-  handle_worker_available(state, algorithm_state, worker);
-  ASSERT_EQ(num_waiting_tasks(algorithm_state), 0);
-  ASSERT_EQ(num_dispatch_tasks(algorithm_state), 0);
-  reset_worker(local_scheduler, worker);
-
-  LocalSchedulerMock_free(local_scheduler);
-  PASS();
-}
-
-TEST start_kill_workers_test(void) {
-  /* Start some workers. */
-  int num_workers = 4;
-  LocalSchedulerMock *local_scheduler = LocalSchedulerMock_init(num_workers, 0);
-  /* We start off with num_workers children processes, but no workers
-   * registered yet. */
-  ASSERT_EQ(local_scheduler->local_scheduler_state->child_pids.size(),
-            static_cast<size_t>(num_workers));
-  ASSERT_EQ(local_scheduler->local_scheduler_state->workers.size(), 0);
-
-  /* Make sure that each worker connects to the local_scheduler scheduler. This
-   * for loop will hang if one of the workers does not connect. */
-  for (int i = 0; i < num_workers; ++i) {
-    new_client_connection(local_scheduler->loop,
-                          local_scheduler->local_scheduler_fd,
-                          (void *) local_scheduler->local_scheduler_state, 0);
-  }
-
-  /* After handling each worker's initial connection, we should now have all
-   * workers accounted for, but we haven't yet matched up process IDs with our
-   * children processes.
-   */
-  ASSERT_EQ(local_scheduler->local_scheduler_state->child_pids.size(),
-            static_cast<size_t>(num_workers));
-  ASSERT_EQ(local_scheduler->local_scheduler_state->workers.size(),
-            static_cast<size_t>(num_workers));
-
-  /* Each worker should register its process ID. */
-  for (auto const &worker : local_scheduler->local_scheduler_state->workers) {
-    process_message(local_scheduler->local_scheduler_state->loop, worker->sock,
-                    worker, 0);
-  }
-  ASSERT_EQ(local_scheduler->local_scheduler_state->child_pids.size(), 0);
-  ASSERT_EQ(local_scheduler->local_scheduler_state->workers.size(),
-            static_cast<size_t>(num_workers));
-
-  /* After killing a worker, its state is cleaned up. */
-  LocalSchedulerClient *worker =
-      local_scheduler->local_scheduler_state->workers.front();
-  kill_worker(local_scheduler->local_scheduler_state, worker, false, false);
-  ASSERT_EQ(local_scheduler->local_scheduler_state->child_pids.size(), 0);
-  ASSERT_EQ(local_scheduler->local_scheduler_state->workers.size(),
-            static_cast<size_t>(num_workers - 1));
-
-  /* Start a worker after the local scheduler has been initialized. */
-  start_worker(local_scheduler->local_scheduler_state);
-  /* Accept the workers as clients to the plasma manager. */
-  int new_worker_fd = accept_client(local_scheduler->plasma_manager_fd);
-  /* The new worker should register its process ID. */
-  ASSERT_EQ(local_scheduler->local_scheduler_state->child_pids.size(), 1);
-  ASSERT_EQ(local_scheduler->local_scheduler_state->workers.size(),
-            static_cast<size_t>(num_workers - 1));
-  /* Make sure the new worker connects to the local_scheduler scheduler. */
-  new_client_connection(local_scheduler->loop,
-                        local_scheduler->local_scheduler_fd,
-                        (void *) local_scheduler->local_scheduler_state, 0);
-  ASSERT_EQ(local_scheduler->local_scheduler_state->child_pids.size(), 1);
-  ASSERT_EQ(local_scheduler->local_scheduler_state->workers.size(),
-            static_cast<size_t>(num_workers));
-  /* Make sure that the new worker registers its process ID. */
-  worker = local_scheduler->local_scheduler_state->workers.back();
-  process_message(local_scheduler->local_scheduler_state->loop, worker->sock,
-                  worker, 0);
-  ASSERT_EQ(local_scheduler->local_scheduler_state->child_pids.size(), 0);
-  ASSERT_EQ(local_scheduler->local_scheduler_state->workers.size(),
-            static_cast<size_t>(num_workers));
-
-  /* Clean up. */
-  close(new_worker_fd);
-  LocalSchedulerMock_free(local_scheduler);
-  PASS();
-}
-
-SUITE(local_scheduler_tests) {
-  RUN_REDIS_TEST(object_reconstruction_test);
-  RUN_REDIS_TEST(object_reconstruction_recursive_test);
-  RUN_REDIS_TEST(object_reconstruction_suppression_test);
-  RUN_REDIS_TEST(task_dependency_test);
-  RUN_REDIS_TEST(task_multi_dependency_test);
-  RUN_REDIS_TEST(start_kill_workers_test);
-}
-
-GREATEST_MAIN_DEFS();
-
-int main(int argc, char **argv) {
-  g_task_builder = make_task_builder();
-  GREATEST_MAIN_BEGIN();
-  RUN_SUITE(local_scheduler_tests);
-  GREATEST_MAIN_END();
-}
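The deleted tests above exercise the local scheduler's two-queue model: a submitted task sits in a waiting queue until every input object is locally available, moves to a dispatch queue once it is runnable, is handed out only when a worker becomes free, and is demoted back to the waiting queue if an input disappears. The following self-contained C++ sketch mirrors the transitions those assertions check; it uses hypothetical names (TwoQueueScheduler, Submit, ObjectAvailable, and so on are illustrative only, not the scheduler's real API).

    // Minimal sketch of the waiting/dispatch queue state machine the deleted
    // tests assert on. All names here are hypothetical.
    #include <cassert>
    #include <deque>
    #include <set>
    #include <string>
    #include <vector>

    struct Task {
      std::vector<std::string> inputs;  // object IDs this task depends on
    };

    class TwoQueueScheduler {
     public:
      void Submit(const Task &task) {
        (Ready(task) ? dispatch_ : waiting_).push_back(task);
      }
      void ObjectAvailable(const std::string &oid) {
        available_.insert(oid);
        // Promote newly runnable tasks from waiting to dispatch.
        std::deque<Task> still_waiting;
        for (const Task &t : waiting_) {
          (Ready(t) ? dispatch_ : still_waiting).push_back(t);
        }
        waiting_.swap(still_waiting);
      }
      void ObjectRemoved(const std::string &oid) {
        available_.erase(oid);
        // Tasks whose inputs vanished move back from dispatch to waiting.
        std::deque<Task> still_ready;
        for (const Task &t : dispatch_) {
          (Ready(t) ? still_ready : waiting_).push_back(t);
        }
        dispatch_.swap(still_ready);
      }
      bool AssignToWorker() {
        if (dispatch_.empty()) return false;
        dispatch_.pop_front();  // hand the front task to the idle worker
        return true;
      }
      size_t NumWaiting() const { return waiting_.size(); }
      size_t NumDispatch() const { return dispatch_.size(); }

     private:
      bool Ready(const Task &t) const {
        for (const std::string &oid : t.inputs) {
          if (available_.count(oid) == 0) return false;
        }
        return true;
      }
      std::set<std::string> available_;
      std::deque<Task> waiting_;   // inputs missing
      std::deque<Task> dispatch_;  // runnable, waiting for a worker
    };

    int main() {
      TwoQueueScheduler s;
      s.Submit(Task{{"oid1", "oid2"}});
      assert(s.NumWaiting() == 1 && s.NumDispatch() == 0);
      s.ObjectAvailable("oid2");   // one of two inputs: still waiting
      assert(s.NumWaiting() == 1);
      s.ObjectAvailable("oid1");   // all inputs ready: moves to dispatch
      assert(s.NumDispatch() == 1);
      s.ObjectRemoved("oid1");     // input lost: demoted back to waiting
      assert(s.NumWaiting() == 1 && s.NumDispatch() == 0);
      s.ObjectAvailable("oid1");
      assert(s.AssignToWorker());  // worker shows up: task is assigned
      return 0;
    }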
diff --git a/src/local_scheduler/test/run_tests.sh b/src/local_scheduler/test/run_tests.sh
deleted file mode 100644
index 9c1d7be79b788..0000000000000
--- a/src/local_scheduler/test/run_tests.sh
+++ /dev/null
@@ -1,38 +0,0 @@
-#!/usr/bin/env bash
-
-# This needs to be run in the build tree, which is normally ray/build
-
-# Cause the script to exit if a single command fails.
-set -e
-
-LaunchRedis() {
-    port=$1
-    if [[ "${RAY_USE_NEW_GCS}" = "on" ]]; then
-        ./src/credis/redis/src/redis-server \
-            --loglevel warning \
-            --loadmodule ./src/credis/build/src/libmember.so \
-            --loadmodule ./src/common/redis_module/libray_redis_module.so \
-            --port $port &
-    else
-        ./src/common/thirdparty/redis/src/redis-server \
-            --loglevel warning \
-            --loadmodule ./src/common/redis_module/libray_redis_module.so \
-            --port $port &
-    fi
-}
-
-
-# Start the Redis shards.
-LaunchRedis 6379
-LaunchRedis 6380
-sleep 1s
-# Register the shard location with the primary shard.
-./src/common/thirdparty/redis/src/redis-cli set NumRedisShards 1
-./src/common/thirdparty/redis/src/redis-cli rpush RedisShards 127.0.0.1:6380
-
-./src/plasma/plasma_store_server -s /tmp/plasma_store_socket_1 -m 100000000 &
-sleep 0.5s
-./src/local_scheduler/local_scheduler_tests
-./src/common/thirdparty/redis/src/redis-cli shutdown
-./src/common/thirdparty/redis/src/redis-cli -p 6380 shutdown
-killall plasma_store_server
diff --git a/src/local_scheduler/test/run_valgrind.sh b/src/local_scheduler/test/run_valgrind.sh
deleted file mode 100644
index 6ff1dbe33c628..0000000000000
--- a/src/local_scheduler/test/run_valgrind.sh
+++ /dev/null
@@ -1,41 +0,0 @@
-#!/usr/bin/env bash
-
-# This needs to be run in the build tree, which is normally ray/build
-
-set -x
-
-# Cause the script to exit if a single command fails.
-set -e
-
-LaunchRedis() {
-    port=$1
-    if [[ "${RAY_USE_NEW_GCS}" = "on" ]]; then
-        ./src/credis/redis/src/redis-server \
-            --loglevel warning \
-            --loadmodule ./src/credis/build/src/libmember.so \
-            --loadmodule ./src/common/redis_module/libray_redis_module.so \
-            --port $port &
-    else
-        ./src/common/thirdparty/redis/src/redis-server \
-            --loglevel warning \
-            --loadmodule ./src/common/redis_module/libray_redis_module.so \
-            --port $port &
-    fi
-}
-
-
-# Start the Redis shards.
-LaunchRedis 6379
-LaunchRedis 6380
-sleep 1s
-
-# Register the shard location with the primary shard.
-./src/common/thirdparty/redis/src/redis-cli set NumRedisShards 1
-./src/common/thirdparty/redis/src/redis-cli rpush RedisShards 127.0.0.1:6380
-
-./src/plasma/plasma_store_server -s /tmp/plasma_store_socket_1 -m 100000000 &
-sleep 0.5s
-valgrind --track-origins=yes --leak-check=full --show-leak-kinds=all --leak-check-heuristics=stdstring --error-exitcode=1 ./src/local_scheduler/local_scheduler_tests
-./src/common/thirdparty/redis/src/redis-cli shutdown
-./src/common/thirdparty/redis/src/redis-cli -p 6380 shutdown
-killall plasma_store_server
diff --git a/src/plasma/CMakeLists.txt b/src/plasma/CMakeLists.txt
deleted file mode 100644
index 5037a54da3d71..0000000000000
--- a/src/plasma/CMakeLists.txt
+++ /dev/null
@@ -1,61 +0,0 @@
-cmake_minimum_required(VERSION 3.4)
-
-project(plasma)
-
-include_directories(${CMAKE_CURRENT_LIST_DIR})
-include_directories(${CMAKE_CURRENT_LIST_DIR}/thirdparty)
-
-set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} --std=c99 -O3")
-set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} --std=c++11 -O3 -Werror -Wall")
-
-if(UNIX AND NOT APPLE)
-  link_libraries(rt)
-endif()
-
-include_directories("${ARROW_INCLUDE_DIR}")
-
-set(PLASMA_FBS_SRC "${CMAKE_CURRENT_LIST_DIR}/format/plasma.fbs" "${CMAKE_CURRENT_LIST_DIR}/format/common.fbs")
-set(OUTPUT_DIR ${CMAKE_CURRENT_LIST_DIR}/format/)
-
-set(PLASMA_FBS_OUTPUT_FILES
-  "${OUTPUT_DIR}/plasma_generated.h"
-  "${OUTPUT_DIR}/common_generated.h")
-
-add_custom_target(gen_plasma_fbs DEPENDS ${PLASMA_FBS_OUTPUT_FILES})
-add_dependencies(gen_plasma_fbs arrow_ep)
-
-# Copy the fbs files from Arrow project to local directory.
-add_custom_command(
-  OUTPUT ${PLASMA_FBS_SRC}
-  COMMAND mkdir -p ${CMAKE_CURRENT_LIST_DIR}/format/
-  COMMAND cp ${ARROW_SOURCE_DIR}/cpp/src/plasma/format/plasma.fbs ${CMAKE_CURRENT_LIST_DIR}/format/
-  COMMAND cp ${ARROW_SOURCE_DIR}/cpp/src/plasma/format/common.fbs ${CMAKE_CURRENT_LIST_DIR}/format/
-  COMMENT "Copying ${PLASMA_FBS_SRC} to local"
-  VERBATIM)
-
-# Compile flatbuffers
-add_custom_command(
-  OUTPUT ${PLASMA_FBS_OUTPUT_FILES}
-  # The --gen-object-api flag generates a C++ class MessageT for each
-  # flatbuffers message Message, which can be used to store deserialized
-  # messages in data structures. This is currently used for ObjectInfo for
-  # example.
-  COMMAND ${FLATBUFFERS_COMPILER} -c -o ${OUTPUT_DIR} ${PLASMA_FBS_SRC} --gen-object-api --scoped-enums
-  DEPENDS ${PLASMA_FBS_SRC}
-  COMMENT "Running flatc compiler on ${PLASMA_FBS_SRC}"
-  VERBATIM)
-
-include_directories("${FLATBUFFERS_INCLUDE_DIR}")
-
-set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fPIC")
-
-add_executable(plasma_manager
-  plasma_manager.cc)
-add_dependencies(plasma_manager gen_plasma_fbs)
-
-target_link_libraries(plasma_manager common ${PLASMA_STATIC_LIB} ray_static ${ARROW_STATIC_LIB} -lpthread ${Boost_SYSTEM_LIBRARY})
-
-define_test(client_tests "")
-define_test(manager_tests "" plasma_manager.cc)
-target_link_libraries(manager_tests ${Boost_SYSTEM_LIBRARY})
-add_dependencies(manager_tests gen_plasma_fbs)
diff --git a/src/plasma/doc/plasma-doxy-config b/src/plasma/doc/plasma-doxy-config
deleted file mode 100644
index 9c291f8388833..0000000000000
--- a/src/plasma/doc/plasma-doxy-config
+++ /dev/null
@@ -1,2473 +0,0 @@
-# Doxyfile 1.8.13
-
-# This file describes the settings to be used by the documentation system
-# doxygen (www.doxygen.org) for a project.
-#
-# All text after a double hash (##) is considered a comment and is placed in
-# front of the TAG it is preceding.
-#
-# All text after a single hash (#) is considered a comment and will be ignored.
-# The format is: -# TAG = value [value, ...] -# For lists, items can also be appended using: -# TAG += value [value, ...] -# Values that contain spaces should be placed between quotes (\" \"). - -#--------------------------------------------------------------------------- -# Project related configuration options -#--------------------------------------------------------------------------- - -# This tag specifies the encoding used for all characters in the config file -# that follow. The default is UTF-8 which is also the encoding used for all text -# before the first occurrence of this tag. Doxygen uses libiconv (or the iconv -# built into libc) for the transcoding. See http://www.gnu.org/software/libiconv -# for the list of possible encodings. -# The default value is: UTF-8. - -DOXYFILE_ENCODING = UTF-8 - -# The PROJECT_NAME tag is a single word (or a sequence of words surrounded by -# double-quotes, unless you are using Doxywizard) that should identify the -# project for which the documentation is generated. This name is used in the -# title of most generated pages and in a few other places. -# The default value is: My Project. - -PROJECT_NAME = "Plasma" - -# The PROJECT_NUMBER tag can be used to enter a project or revision number. This -# could be handy for archiving the generated documentation or if some version -# control system is used. - -PROJECT_NUMBER = - -# Using the PROJECT_BRIEF tag one can provide an optional one line description -# for a project that appears at the top of each page and should give viewer a -# quick idea about the purpose of the project. Keep the description short. - -PROJECT_BRIEF = - -# With the PROJECT_LOGO tag one can specify a logo or an icon that is included -# in the documentation. The maximum height of the logo should not exceed 55 -# pixels and the maximum width should not exceed 200 pixels. Doxygen will copy -# the logo to the output directory. - -PROJECT_LOGO = - -# The OUTPUT_DIRECTORY tag is used to specify the (relative or absolute) path -# into which the generated documentation will be written. If a relative path is -# entered, it will be relative to the location where doxygen was started. If -# left blank the current directory will be used. - -OUTPUT_DIRECTORY = - -# If the CREATE_SUBDIRS tag is set to YES then doxygen will create 4096 sub- -# directories (in 2 levels) under the output directory of each output format and -# will distribute the generated files over these directories. Enabling this -# option can be useful when feeding doxygen a huge amount of source files, where -# putting all generated files in the same directory would otherwise causes -# performance problems for the file system. -# The default value is: NO. - -CREATE_SUBDIRS = NO - -# If the ALLOW_UNICODE_NAMES tag is set to YES, doxygen will allow non-ASCII -# characters to appear in the names of generated files. If set to NO, non-ASCII -# characters will be escaped, for example _xE3_x81_x84 will be used for Unicode -# U+3044. -# The default value is: NO. - -ALLOW_UNICODE_NAMES = NO - -# The OUTPUT_LANGUAGE tag is used to specify the language in which all -# documentation generated by doxygen is written. Doxygen will use this -# information to generate all constant output in the proper language. 
-# Possible values are: Afrikaans, Arabic, Armenian, Brazilian, Catalan, Chinese, -# Chinese-Traditional, Croatian, Czech, Danish, Dutch, English (United States), -# Esperanto, Farsi (Persian), Finnish, French, German, Greek, Hungarian, -# Indonesian, Italian, Japanese, Japanese-en (Japanese with English messages), -# Korean, Korean-en (Korean with English messages), Latvian, Lithuanian, -# Macedonian, Norwegian, Persian (Farsi), Polish, Portuguese, Romanian, Russian, -# Serbian, Serbian-Cyrillic, Slovak, Slovene, Spanish, Swedish, Turkish, -# Ukrainian and Vietnamese. -# The default value is: English. - -OUTPUT_LANGUAGE = English - -# If the BRIEF_MEMBER_DESC tag is set to YES, doxygen will include brief member -# descriptions after the members that are listed in the file and class -# documentation (similar to Javadoc). Set to NO to disable this. -# The default value is: YES. - -BRIEF_MEMBER_DESC = YES - -# If the REPEAT_BRIEF tag is set to YES, doxygen will prepend the brief -# description of a member or function before the detailed description -# -# Note: If both HIDE_UNDOC_MEMBERS and BRIEF_MEMBER_DESC are set to NO, the -# brief descriptions will be completely suppressed. -# The default value is: YES. - -REPEAT_BRIEF = YES - -# This tag implements a quasi-intelligent brief description abbreviator that is -# used to form the text in various listings. Each string in this list, if found -# as the leading text of the brief description, will be stripped from the text -# and the result, after processing the whole list, is used as the annotated -# text. Otherwise, the brief description is used as-is. If left blank, the -# following values are used ($name is automatically replaced with the name of -# the entity):The $name class, The $name widget, The $name file, is, provides, -# specifies, contains, represents, a, an and the. - -ABBREVIATE_BRIEF = "The $name class" \ - "The $name widget" \ - "The $name file" \ - is \ - provides \ - specifies \ - contains \ - represents \ - a \ - an \ - the - -# If the ALWAYS_DETAILED_SEC and REPEAT_BRIEF tags are both set to YES then -# doxygen will generate a detailed section even if there is only a brief -# description. -# The default value is: NO. - -ALWAYS_DETAILED_SEC = NO - -# If the INLINE_INHERITED_MEMB tag is set to YES, doxygen will show all -# inherited members of a class in the documentation of that class as if those -# members were ordinary class members. Constructors, destructors and assignment -# operators of the base classes will not be shown. -# The default value is: NO. - -INLINE_INHERITED_MEMB = NO - -# If the FULL_PATH_NAMES tag is set to YES, doxygen will prepend the full path -# before files name in the file list and in the header files. If set to NO the -# shortest path that makes the file name unique will be used -# The default value is: YES. - -FULL_PATH_NAMES = YES - -# The STRIP_FROM_PATH tag can be used to strip a user-defined part of the path. -# Stripping is only done if one of the specified strings matches the left-hand -# part of the path. The tag can be used to show relative paths in the file list. -# If left blank the directory from which doxygen is run is used as the path to -# strip. -# -# Note that you can specify absolute paths here, but also relative paths, which -# will be relative from the directory where doxygen is started. -# This tag requires that the tag FULL_PATH_NAMES is set to YES. 
- -STRIP_FROM_PATH = - -# The STRIP_FROM_INC_PATH tag can be used to strip a user-defined part of the -# path mentioned in the documentation of a class, which tells the reader which -# header file to include in order to use a class. If left blank only the name of -# the header file containing the class definition is used. Otherwise one should -# specify the list of include paths that are normally passed to the compiler -# using the -I flag. - -STRIP_FROM_INC_PATH = - -# If the SHORT_NAMES tag is set to YES, doxygen will generate much shorter (but -# less readable) file names. This can be useful is your file systems doesn't -# support long names like on DOS, Mac, or CD-ROM. -# The default value is: NO. - -SHORT_NAMES = NO - -# If the JAVADOC_AUTOBRIEF tag is set to YES then doxygen will interpret the -# first line (until the first dot) of a Javadoc-style comment as the brief -# description. If set to NO, the Javadoc-style will behave just like regular Qt- -# style comments (thus requiring an explicit @brief command for a brief -# description.) -# The default value is: NO. - -JAVADOC_AUTOBRIEF = NO - -# If the QT_AUTOBRIEF tag is set to YES then doxygen will interpret the first -# line (until the first dot) of a Qt-style comment as the brief description. If -# set to NO, the Qt-style will behave just like regular Qt-style comments (thus -# requiring an explicit \brief command for a brief description.) -# The default value is: NO. - -QT_AUTOBRIEF = NO - -# The MULTILINE_CPP_IS_BRIEF tag can be set to YES to make doxygen treat a -# multi-line C++ special comment block (i.e. a block of //! or /// comments) as -# a brief description. This used to be the default behavior. The new default is -# to treat a multi-line C++ comment block as a detailed description. Set this -# tag to YES if you prefer the old behavior instead. -# -# Note that setting this tag to YES also means that rational rose comments are -# not recognized any more. -# The default value is: NO. - -MULTILINE_CPP_IS_BRIEF = NO - -# If the INHERIT_DOCS tag is set to YES then an undocumented member inherits the -# documentation from any documented member that it re-implements. -# The default value is: YES. - -INHERIT_DOCS = YES - -# If the SEPARATE_MEMBER_PAGES tag is set to YES then doxygen will produce a new -# page for each member. If set to NO, the documentation of a member will be part -# of the file/class/namespace that contains it. -# The default value is: NO. - -SEPARATE_MEMBER_PAGES = NO - -# The TAB_SIZE tag can be used to set the number of spaces in a tab. Doxygen -# uses this value to replace tabs by spaces in code fragments. -# Minimum value: 1, maximum value: 16, default value: 4. - -TAB_SIZE = 2 - -# This tag can be used to specify a number of aliases that act as commands in -# the documentation. An alias has the form: -# name=value -# For example adding -# "sideeffect=@par Side Effects:\n" -# will allow you to put the command \sideeffect (or @sideeffect) in the -# documentation, which will result in a user-defined paragraph with heading -# "Side Effects:". You can put \n's in the value part of an alias to insert -# newlines. - -ALIASES = - -# This tag can be used to specify a number of word-keyword mappings (TCL only). -# A mapping has the form "name=value". For example adding "class=itcl::class" -# will allow you to use the command class in the itcl::class meaning. - -TCL_SUBST = - -# Set the OPTIMIZE_OUTPUT_FOR_C tag to YES if your project consists of C sources -# only. 
Doxygen will then generate output that is more tailored for C. For -# instance, some of the names that are used will be different. The list of all -# members will be omitted, etc. -# The default value is: NO. - -OPTIMIZE_OUTPUT_FOR_C = NO - -# Set the OPTIMIZE_OUTPUT_JAVA tag to YES if your project consists of Java or -# Python sources only. Doxygen will then generate output that is more tailored -# for that language. For instance, namespaces will be presented as packages, -# qualified scopes will look different, etc. -# The default value is: NO. - -OPTIMIZE_OUTPUT_JAVA = NO - -# Set the OPTIMIZE_FOR_FORTRAN tag to YES if your project consists of Fortran -# sources. Doxygen will then generate output that is tailored for Fortran. -# The default value is: NO. - -OPTIMIZE_FOR_FORTRAN = NO - -# Set the OPTIMIZE_OUTPUT_VHDL tag to YES if your project consists of VHDL -# sources. Doxygen will then generate output that is tailored for VHDL. -# The default value is: NO. - -OPTIMIZE_OUTPUT_VHDL = NO - -# Doxygen selects the parser to use depending on the extension of the files it -# parses. With this tag you can assign which parser to use for a given -# extension. Doxygen has a built-in mapping, but you can override or extend it -# using this tag. The format is ext=language, where ext is a file extension, and -# language is one of the parsers supported by doxygen: IDL, Java, Javascript, -# C#, C, C++, D, PHP, Objective-C, Python, Fortran (fixed format Fortran: -# FortranFixed, free formatted Fortran: FortranFree, unknown formatted Fortran: -# Fortran. In the later case the parser tries to guess whether the code is fixed -# or free formatted code, this is the default for Fortran type files), VHDL. For -# instance to make doxygen treat .inc files as Fortran files (default is PHP), -# and .f files as C (default is Fortran), use: inc=Fortran f=C. -# -# Note: For files without extension you can use no_extension as a placeholder. -# -# Note that for custom extensions you also need to set FILE_PATTERNS otherwise -# the files are not read by doxygen. - -EXTENSION_MAPPING = - -# If the MARKDOWN_SUPPORT tag is enabled then doxygen pre-processes all comments -# according to the Markdown format, which allows for more readable -# documentation. See http://daringfireball.net/projects/markdown/ for details. -# The output of markdown processing is further processed by doxygen, so you can -# mix doxygen, HTML, and XML commands with Markdown formatting. Disable only in -# case of backward compatibilities issues. -# The default value is: YES. - -MARKDOWN_SUPPORT = YES - -# When the TOC_INCLUDE_HEADINGS tag is set to a non-zero value, all headings up -# to that level are automatically included in the table of contents, even if -# they do not have an id attribute. -# Note: This feature currently applies only to Markdown headings. -# Minimum value: 0, maximum value: 99, default value: 0. -# This tag requires that the tag MARKDOWN_SUPPORT is set to YES. - -TOC_INCLUDE_HEADINGS = 0 - -# When enabled doxygen tries to link words that correspond to documented -# classes, or namespaces to their corresponding documentation. Such a link can -# be prevented in individual cases by putting a % sign in front of the word or -# globally by setting AUTOLINK_SUPPORT to NO. -# The default value is: YES. - -AUTOLINK_SUPPORT = YES - -# If you use STL classes (i.e. std::string, std::vector, etc.) 
but do not want -# to include (a tag file for) the STL sources as input, then you should set this -# tag to YES in order to let doxygen match functions declarations and -# definitions whose arguments contain STL classes (e.g. func(std::string); -# versus func(std::string) {}). This also make the inheritance and collaboration -# diagrams that involve STL classes more complete and accurate. -# The default value is: NO. - -BUILTIN_STL_SUPPORT = NO - -# If you use Microsoft's C++/CLI language, you should set this option to YES to -# enable parsing support. -# The default value is: NO. - -CPP_CLI_SUPPORT = NO - -# Set the SIP_SUPPORT tag to YES if your project consists of sip (see: -# http://www.riverbankcomputing.co.uk/software/sip/intro) sources only. Doxygen -# will parse them like normal C++ but will assume all classes use public instead -# of private inheritance when no explicit protection keyword is present. -# The default value is: NO. - -SIP_SUPPORT = NO - -# For Microsoft's IDL there are propget and propput attributes to indicate -# getter and setter methods for a property. Setting this option to YES will make -# doxygen to replace the get and set methods by a property in the documentation. -# This will only work if the methods are indeed getting or setting a simple -# type. If this is not the case, or you want to show the methods anyway, you -# should set this option to NO. -# The default value is: YES. - -IDL_PROPERTY_SUPPORT = YES - -# If member grouping is used in the documentation and the DISTRIBUTE_GROUP_DOC -# tag is set to YES then doxygen will reuse the documentation of the first -# member in the group (if any) for the other members of the group. By default -# all members of a group must be documented explicitly. -# The default value is: NO. - -DISTRIBUTE_GROUP_DOC = NO - -# If one adds a struct or class to a group and this option is enabled, then also -# any nested class or struct is added to the same group. By default this option -# is disabled and one has to add nested compounds explicitly via \ingroup. -# The default value is: NO. - -GROUP_NESTED_COMPOUNDS = NO - -# Set the SUBGROUPING tag to YES to allow class member groups of the same type -# (for instance a group of public functions) to be put as a subgroup of that -# type (e.g. under the Public Functions section). Set it to NO to prevent -# subgrouping. Alternatively, this can be done per class using the -# \nosubgrouping command. -# The default value is: YES. - -SUBGROUPING = YES - -# When the INLINE_GROUPED_CLASSES tag is set to YES, classes, structs and unions -# are shown inside the group in which they are included (e.g. using \ingroup) -# instead of on a separate page (for HTML and Man pages) or section (for LaTeX -# and RTF). -# -# Note that this feature does not work in combination with -# SEPARATE_MEMBER_PAGES. -# The default value is: NO. - -INLINE_GROUPED_CLASSES = NO - -# When the INLINE_SIMPLE_STRUCTS tag is set to YES, structs, classes, and unions -# with only public data fields or simple typedef fields will be shown inline in -# the documentation of the scope in which they are defined (i.e. file, -# namespace, or group documentation), provided this scope is documented. If set -# to NO, structs, classes, and unions are shown on a separate page (for HTML and -# Man pages) or section (for LaTeX and RTF). -# The default value is: NO. 
- -INLINE_SIMPLE_STRUCTS = NO - -# When TYPEDEF_HIDES_STRUCT tag is enabled, a typedef of a struct, union, or -# enum is documented as struct, union, or enum with the name of the typedef. So -# typedef struct TypeS {} TypeT, will appear in the documentation as a struct -# with name TypeT. When disabled the typedef will appear as a member of a file, -# namespace, or class. And the struct will be named TypeS. This can typically be -# useful for C code in case the coding convention dictates that all compound -# types are typedef'ed and only the typedef is referenced, never the tag name. -# The default value is: NO. - -TYPEDEF_HIDES_STRUCT = NO - -# The size of the symbol lookup cache can be set using LOOKUP_CACHE_SIZE. This -# cache is used to resolve symbols given their name and scope. Since this can be -# an expensive process and often the same symbol appears multiple times in the -# code, doxygen keeps a cache of pre-resolved symbols. If the cache is too small -# doxygen will become slower. If the cache is too large, memory is wasted. The -# cache size is given by this formula: 2^(16+LOOKUP_CACHE_SIZE). The valid range -# is 0..9, the default is 0, corresponding to a cache size of 2^16=65536 -# symbols. At the end of a run doxygen will report the cache usage and suggest -# the optimal cache size from a speed point of view. -# Minimum value: 0, maximum value: 9, default value: 0. - -LOOKUP_CACHE_SIZE = 0 - -#--------------------------------------------------------------------------- -# Build related configuration options -#--------------------------------------------------------------------------- - -# If the EXTRACT_ALL tag is set to YES, doxygen will assume all entities in -# documentation are documented, even if no documentation was available. Private -# class members and static file members will be hidden unless the -# EXTRACT_PRIVATE respectively EXTRACT_STATIC tags are set to YES. -# Note: This will also disable the warnings about undocumented members that are -# normally produced when WARNINGS is set to YES. -# The default value is: NO. - -EXTRACT_ALL = YES - -# If the EXTRACT_PRIVATE tag is set to YES, all private members of a class will -# be included in the documentation. -# The default value is: NO. - -EXTRACT_PRIVATE = NO - -# If the EXTRACT_PACKAGE tag is set to YES, all members with package or internal -# scope will be included in the documentation. -# The default value is: NO. - -EXTRACT_PACKAGE = NO - -# If the EXTRACT_STATIC tag is set to YES, all static members of a file will be -# included in the documentation. -# The default value is: NO. - -EXTRACT_STATIC = NO - -# If the EXTRACT_LOCAL_CLASSES tag is set to YES, classes (and structs) defined -# locally in source files will be included in the documentation. If set to NO, -# only classes defined in header files are included. Does not have any effect -# for Java sources. -# The default value is: YES. - -EXTRACT_LOCAL_CLASSES = YES - -# This flag is only useful for Objective-C code. If set to YES, local methods, -# which are defined in the implementation section but not in the interface are -# included in the documentation. If set to NO, only methods in the interface are -# included. -# The default value is: NO. - -EXTRACT_LOCAL_METHODS = NO - -# If this flag is set to YES, the members of anonymous namespaces will be -# extracted and appear in the documentation as a namespace called -# 'anonymous_namespace{file}', where file will be replaced with the base name of -# the file that contains the anonymous namespace. 
By default anonymous namespace -# are hidden. -# The default value is: NO. - -EXTRACT_ANON_NSPACES = NO - -# If the HIDE_UNDOC_MEMBERS tag is set to YES, doxygen will hide all -# undocumented members inside documented classes or files. If set to NO these -# members will be included in the various overviews, but no documentation -# section is generated. This option has no effect if EXTRACT_ALL is enabled. -# The default value is: NO. - -HIDE_UNDOC_MEMBERS = NO - -# If the HIDE_UNDOC_CLASSES tag is set to YES, doxygen will hide all -# undocumented classes that are normally visible in the class hierarchy. If set -# to NO, these classes will be included in the various overviews. This option -# has no effect if EXTRACT_ALL is enabled. -# The default value is: NO. - -HIDE_UNDOC_CLASSES = NO - -# If the HIDE_FRIEND_COMPOUNDS tag is set to YES, doxygen will hide all friend -# (class|struct|union) declarations. If set to NO, these declarations will be -# included in the documentation. -# The default value is: NO. - -HIDE_FRIEND_COMPOUNDS = NO - -# If the HIDE_IN_BODY_DOCS tag is set to YES, doxygen will hide any -# documentation blocks found inside the body of a function. If set to NO, these -# blocks will be appended to the function's detailed documentation block. -# The default value is: NO. - -HIDE_IN_BODY_DOCS = NO - -# The INTERNAL_DOCS tag determines if documentation that is typed after a -# \internal command is included. If the tag is set to NO then the documentation -# will be excluded. Set it to YES to include the internal documentation. -# The default value is: NO. - -INTERNAL_DOCS = NO - -# If the CASE_SENSE_NAMES tag is set to NO then doxygen will only generate file -# names in lower-case letters. If set to YES, upper-case letters are also -# allowed. This is useful if you have classes or files whose names only differ -# in case and if your file system supports case sensitive file names. Windows -# and Mac users are advised to set this option to NO. -# The default value is: system dependent. - -CASE_SENSE_NAMES = NO - -# If the HIDE_SCOPE_NAMES tag is set to NO then doxygen will show members with -# their full class and namespace scopes in the documentation. If set to YES, the -# scope will be hidden. -# The default value is: NO. - -HIDE_SCOPE_NAMES = NO - -# If the HIDE_COMPOUND_REFERENCE tag is set to NO (default) then doxygen will -# append additional text to a page's title, such as Class Reference. If set to -# YES the compound reference will be hidden. -# The default value is: NO. - -HIDE_COMPOUND_REFERENCE= NO - -# If the SHOW_INCLUDE_FILES tag is set to YES then doxygen will put a list of -# the files that are included by a file in the documentation of that file. -# The default value is: YES. - -SHOW_INCLUDE_FILES = YES - -# If the SHOW_GROUPED_MEMB_INC tag is set to YES then Doxygen will add for each -# grouped member an include statement to the documentation, telling the reader -# which file to include in order to use the member. -# The default value is: NO. - -SHOW_GROUPED_MEMB_INC = NO - -# If the FORCE_LOCAL_INCLUDES tag is set to YES then doxygen will list include -# files with double quotes in the documentation rather than with sharp brackets. -# The default value is: NO. - -FORCE_LOCAL_INCLUDES = NO - -# If the INLINE_INFO tag is set to YES then a tag [inline] is inserted in the -# documentation for inline members. -# The default value is: YES. 
- -INLINE_INFO = YES - -# If the SORT_MEMBER_DOCS tag is set to YES then doxygen will sort the -# (detailed) documentation of file and class members alphabetically by member -# name. If set to NO, the members will appear in declaration order. -# The default value is: YES. - -SORT_MEMBER_DOCS = YES - -# If the SORT_BRIEF_DOCS tag is set to YES then doxygen will sort the brief -# descriptions of file, namespace and class members alphabetically by member -# name. If set to NO, the members will appear in declaration order. Note that -# this will also influence the order of the classes in the class list. -# The default value is: NO. - -SORT_BRIEF_DOCS = NO - -# If the SORT_MEMBERS_CTORS_1ST tag is set to YES then doxygen will sort the -# (brief and detailed) documentation of class members so that constructors and -# destructors are listed first. If set to NO the constructors will appear in the -# respective orders defined by SORT_BRIEF_DOCS and SORT_MEMBER_DOCS. -# Note: If SORT_BRIEF_DOCS is set to NO this option is ignored for sorting brief -# member documentation. -# Note: If SORT_MEMBER_DOCS is set to NO this option is ignored for sorting -# detailed member documentation. -# The default value is: NO. - -SORT_MEMBERS_CTORS_1ST = NO - -# If the SORT_GROUP_NAMES tag is set to YES then doxygen will sort the hierarchy -# of group names into alphabetical order. If set to NO the group names will -# appear in their defined order. -# The default value is: NO. - -SORT_GROUP_NAMES = NO - -# If the SORT_BY_SCOPE_NAME tag is set to YES, the class list will be sorted by -# fully-qualified names, including namespaces. If set to NO, the class list will -# be sorted only by class name, not including the namespace part. -# Note: This option is not very useful if HIDE_SCOPE_NAMES is set to YES. -# Note: This option applies only to the class list, not to the alphabetical -# list. -# The default value is: NO. - -SORT_BY_SCOPE_NAME = NO - -# If the STRICT_PROTO_MATCHING option is enabled and doxygen fails to do proper -# type resolution of all parameters of a function it will reject a match between -# the prototype and the implementation of a member function even if there is -# only one candidate or it is obvious which candidate to choose by doing a -# simple string match. By disabling STRICT_PROTO_MATCHING doxygen will still -# accept a match between prototype and implementation in such cases. -# The default value is: NO. - -STRICT_PROTO_MATCHING = NO - -# The GENERATE_TODOLIST tag can be used to enable (YES) or disable (NO) the todo -# list. This list is created by putting \todo commands in the documentation. -# The default value is: YES. - -GENERATE_TODOLIST = YES - -# The GENERATE_TESTLIST tag can be used to enable (YES) or disable (NO) the test -# list. This list is created by putting \test commands in the documentation. -# The default value is: YES. - -GENERATE_TESTLIST = YES - -# The GENERATE_BUGLIST tag can be used to enable (YES) or disable (NO) the bug -# list. This list is created by putting \bug commands in the documentation. -# The default value is: YES. - -GENERATE_BUGLIST = YES - -# The GENERATE_DEPRECATEDLIST tag can be used to enable (YES) or disable (NO) -# the deprecated list. This list is created by putting \deprecated commands in -# the documentation. -# The default value is: YES. - -GENERATE_DEPRECATEDLIST= YES - -# The ENABLED_SECTIONS tag can be used to enable conditional documentation -# sections, marked by \if ... \endif and \cond -# ... \endcond blocks. 
- -ENABLED_SECTIONS = - -# The MAX_INITIALIZER_LINES tag determines the maximum number of lines that the -# initial value of a variable or macro / define can have for it to appear in the -# documentation. If the initializer consists of more lines than specified here -# it will be hidden. Use a value of 0 to hide initializers completely. The -# appearance of the value of individual variables and macros / defines can be -# controlled using \showinitializer or \hideinitializer command in the -# documentation regardless of this setting. -# Minimum value: 0, maximum value: 10000, default value: 30. - -MAX_INITIALIZER_LINES = 30 - -# Set the SHOW_USED_FILES tag to NO to disable the list of files generated at -# the bottom of the documentation of classes and structs. If set to YES, the -# list will mention the files that were used to generate the documentation. -# The default value is: YES. - -SHOW_USED_FILES = YES - -# Set the SHOW_FILES tag to NO to disable the generation of the Files page. This -# will remove the Files entry from the Quick Index and from the Folder Tree View -# (if specified). -# The default value is: YES. - -SHOW_FILES = YES - -# Set the SHOW_NAMESPACES tag to NO to disable the generation of the Namespaces -# page. This will remove the Namespaces entry from the Quick Index and from the -# Folder Tree View (if specified). -# The default value is: YES. - -SHOW_NAMESPACES = YES - -# The FILE_VERSION_FILTER tag can be used to specify a program or script that -# doxygen should invoke to get the current version for each file (typically from -# the version control system). Doxygen will invoke the program by executing (via -# popen()) the command command input-file, where command is the value of the -# FILE_VERSION_FILTER tag, and input-file is the name of an input file provided -# by doxygen. Whatever the program writes to standard output is used as the file -# version. For an example see the documentation. - -FILE_VERSION_FILTER = - -# The LAYOUT_FILE tag can be used to specify a layout file which will be parsed -# by doxygen. The layout file controls the global structure of the generated -# output files in an output format independent way. To create the layout file -# that represents doxygen's defaults, run doxygen with the -l option. You can -# optionally specify a file name after the option, if omitted DoxygenLayout.xml -# will be used as the name of the layout file. -# -# Note that if you run doxygen from a directory containing a file called -# DoxygenLayout.xml, doxygen will parse it automatically even if the LAYOUT_FILE -# tag is left empty. - -LAYOUT_FILE = - -# The CITE_BIB_FILES tag can be used to specify one or more bib files containing -# the reference definitions. This must be a list of .bib files. The .bib -# extension is automatically appended if omitted. This requires the bibtex tool -# to be installed. See also http://en.wikipedia.org/wiki/BibTeX for more info. -# For LaTeX the style of the bibliography can be controlled using -# LATEX_BIB_STYLE. To use this feature you need bibtex and perl available in the -# search path. See also \cite for info how to create references. - -CITE_BIB_FILES = - -#--------------------------------------------------------------------------- -# Configuration options related to warning and progress messages -#--------------------------------------------------------------------------- - -# The QUIET tag can be used to turn on/off the messages that are generated to -# standard output by doxygen. 
If QUIET is set to YES this implies that the -# messages are off. -# The default value is: NO. - -QUIET = NO - -# The WARNINGS tag can be used to turn on/off the warning messages that are -# generated to standard error (stderr) by doxygen. If WARNINGS is set to YES -# this implies that the warnings are on. -# -# Tip: Turn warnings on while writing the documentation. -# The default value is: YES. - -WARNINGS = YES - -# If the WARN_IF_UNDOCUMENTED tag is set to YES then doxygen will generate -# warnings for undocumented members. If EXTRACT_ALL is set to YES then this flag -# will automatically be disabled. -# The default value is: YES. - -WARN_IF_UNDOCUMENTED = YES - -# If the WARN_IF_DOC_ERROR tag is set to YES, doxygen will generate warnings for -# potential errors in the documentation, such as not documenting some parameters -# in a documented function, or documenting parameters that don't exist or using -# markup commands wrongly. -# The default value is: YES. - -WARN_IF_DOC_ERROR = YES - -# This WARN_NO_PARAMDOC option can be enabled to get warnings for functions that -# are documented, but have no documentation for their parameters or return -# value. If set to NO, doxygen will only warn about wrong or incomplete -# parameter documentation, but not about the absence of documentation. -# The default value is: NO. - -WARN_NO_PARAMDOC = NO - -# If the WARN_AS_ERROR tag is set to YES then doxygen will immediately stop when -# a warning is encountered. -# The default value is: NO. - -WARN_AS_ERROR = NO - -# The WARN_FORMAT tag determines the format of the warning messages that doxygen -# can produce. The string should contain the $file, $line, and $text tags, which -# will be replaced by the file and line number from which the warning originated -# and the warning text. Optionally the format may contain $version, which will -# be replaced by the version of the file (if it could be obtained via -# FILE_VERSION_FILTER) -# The default value is: $file:$line: $text. - -WARN_FORMAT = "$file:$line: $text" - -# The WARN_LOGFILE tag can be used to specify a file to which warning and error -# messages should be written. If left blank the output is written to standard -# error (stderr). - -WARN_LOGFILE = - -#--------------------------------------------------------------------------- -# Configuration options related to the input files -#--------------------------------------------------------------------------- - -# The INPUT tag is used to specify the files and/or directories that contain -# documented source files. You may enter file names like myfile.cpp or -# directories like /usr/src/myproject. Separate the files or directories with -# spaces. See also FILE_PATTERNS and EXTENSION_MAPPING -# Note: If this tag is empty the current directory is searched. - -INPUT = ../src - -# This tag can be used to specify the character encoding of the source files -# that doxygen parses. Internally doxygen uses the UTF-8 encoding. Doxygen uses -# libiconv (or the iconv built into libc) for the transcoding. See the libiconv -# documentation (see: http://www.gnu.org/software/libiconv) for the list of -# possible encodings. -# The default value is: UTF-8. - -INPUT_ENCODING = UTF-8 - -# If the value of the INPUT tag contains directories, you can use the -# FILE_PATTERNS tag to specify one or more wildcard patterns (like *.cpp and -# *.h) to filter out the source-files in the directories. 
-# -# Note that for custom extensions or not directly supported extensions you also -# need to set EXTENSION_MAPPING for the extension otherwise the files are not -# read by doxygen. -# -# If left blank the following patterns are tested:*.c, *.cc, *.cxx, *.cpp, -# *.c++, *.java, *.ii, *.ixx, *.ipp, *.i++, *.inl, *.idl, *.ddl, *.odl, *.h, -# *.hh, *.hxx, *.hpp, *.h++, *.cs, *.d, *.php, *.php4, *.php5, *.phtml, *.inc, -# *.m, *.markdown, *.md, *.mm, *.dox, *.py, *.pyw, *.f90, *.f95, *.f03, *.f08, -# *.f, *.for, *.tcl, *.vhd, *.vhdl, *.ucf and *.qsf. - -FILE_PATTERNS = *.c \ - *.cc \ - *.cxx \ - *.cpp \ - *.c++ \ - *.java \ - *.ii \ - *.ixx \ - *.ipp \ - *.i++ \ - *.inl \ - *.idl \ - *.ddl \ - *.odl \ - *.h \ - *.hh \ - *.hxx \ - *.hpp \ - *.h++ \ - *.cs \ - *.d \ - *.php \ - *.php4 \ - *.php5 \ - *.phtml \ - *.inc \ - *.m \ - *.markdown \ - *.md \ - *.mm \ - *.dox \ - *.py \ - *.pyw \ - *.f90 \ - *.f95 \ - *.f03 \ - *.f08 \ - *.f \ - *.for \ - *.tcl \ - *.vhd \ - *.vhdl \ - *.ucf \ - *.qsf - -# The RECURSIVE tag can be used to specify whether or not subdirectories should -# be searched for input files as well. -# The default value is: NO. - -RECURSIVE = NO - -# The EXCLUDE tag can be used to specify files and/or directories that should be -# excluded from the INPUT source files. This way you can easily exclude a -# subdirectory from a directory tree whose root is specified with the INPUT tag. -# -# Note that relative paths are relative to the directory from which doxygen is -# run. - -EXCLUDE = ../src/utarray.h ../src/uthash.h - -# The EXCLUDE_SYMLINKS tag can be used to select whether or not files or -# directories that are symbolic links (a Unix file system feature) are excluded -# from the input. -# The default value is: NO. - -EXCLUDE_SYMLINKS = NO - -# If the value of the INPUT tag contains directories, you can use the -# EXCLUDE_PATTERNS tag to specify one or more wildcard patterns to exclude -# certain files from those directories. -# -# Note that the wildcards are matched against the file with absolute path, so to -# exclude all test directories for example use the pattern */test/* - -EXCLUDE_PATTERNS = - -# The EXCLUDE_SYMBOLS tag can be used to specify one or more symbol names -# (namespaces, classes, functions, etc.) that should be excluded from the -# output. The symbol name can be a fully qualified name, a word, or if the -# wildcard * is used, a substring. Examples: ANamespace, AClass, -# AClass::ANamespace, ANamespace::*Test -# -# Note that the wildcards are matched against the file with absolute path, so to -# exclude all test directories use the pattern */test/* - -EXCLUDE_SYMBOLS = - -# The EXAMPLE_PATH tag can be used to specify one or more files or directories -# that contain example code fragments that are included (see the \include -# command). - -EXAMPLE_PATH = - -# If the value of the EXAMPLE_PATH tag contains directories, you can use the -# EXAMPLE_PATTERNS tag to specify one or more wildcard pattern (like *.cpp and -# *.h) to filter out the source-files in the directories. If left blank all -# files are included. - -EXAMPLE_PATTERNS = * - -# If the EXAMPLE_RECURSIVE tag is set to YES then subdirectories will be -# searched for input files to be used with the \include or \dontinclude commands -# irrespective of the value of the RECURSIVE tag. -# The default value is: NO. 
- -EXAMPLE_RECURSIVE = NO - -# The IMAGE_PATH tag can be used to specify one or more files or directories -# that contain images that are to be included in the documentation (see the -# \image command). - -IMAGE_PATH = - -# The INPUT_FILTER tag can be used to specify a program that doxygen should -# invoke to filter for each input file. Doxygen will invoke the filter program -# by executing (via popen()) the command: -# -# -# -# where is the value of the INPUT_FILTER tag, and is the -# name of an input file. Doxygen will then use the output that the filter -# program writes to standard output. If FILTER_PATTERNS is specified, this tag -# will be ignored. -# -# Note that the filter must not add or remove lines; it is applied before the -# code is scanned, but not when the output code is generated. If lines are added -# or removed, the anchors will not be placed correctly. -# -# Note that for custom extensions or not directly supported extensions you also -# need to set EXTENSION_MAPPING for the extension otherwise the files are not -# properly processed by doxygen. - -INPUT_FILTER = - -# The FILTER_PATTERNS tag can be used to specify filters on a per file pattern -# basis. Doxygen will compare the file name with each pattern and apply the -# filter if there is a match. The filters are a list of the form: pattern=filter -# (like *.cpp=my_cpp_filter). See INPUT_FILTER for further information on how -# filters are used. If the FILTER_PATTERNS tag is empty or if none of the -# patterns match the file name, INPUT_FILTER is applied. -# -# Note that for custom extensions or not directly supported extensions you also -# need to set EXTENSION_MAPPING for the extension otherwise the files are not -# properly processed by doxygen. - -FILTER_PATTERNS = - -# If the FILTER_SOURCE_FILES tag is set to YES, the input filter (if set using -# INPUT_FILTER) will also be used to filter the input files that are used for -# producing the source files to browse (i.e. when SOURCE_BROWSER is set to YES). -# The default value is: NO. - -FILTER_SOURCE_FILES = NO - -# The FILTER_SOURCE_PATTERNS tag can be used to specify source filters per file -# pattern. A pattern will override the setting for FILTER_PATTERN (if any) and -# it is also possible to disable source filtering for a specific pattern using -# *.ext= (so without naming a filter). -# This tag requires that the tag FILTER_SOURCE_FILES is set to YES. - -FILTER_SOURCE_PATTERNS = - -# If the USE_MDFILE_AS_MAINPAGE tag refers to the name of a markdown file that -# is part of the input, its contents will be placed on the main page -# (index.html). This can be useful if you have a project on for instance GitHub -# and want to reuse the introduction page also for the doxygen output. - -USE_MDFILE_AS_MAINPAGE = - -#--------------------------------------------------------------------------- -# Configuration options related to source browsing -#--------------------------------------------------------------------------- - -# If the SOURCE_BROWSER tag is set to YES then a list of source files will be -# generated. Documented entities will be cross-referenced with these sources. -# -# Note: To get rid of all source code in the generated output, make sure that -# also VERBATIM_HEADERS is set to NO. -# The default value is: NO. - -SOURCE_BROWSER = NO - -# Setting the INLINE_SOURCES tag to YES will include the body of functions, -# classes and enums directly into the documentation. -# The default value is: NO. 
- -INLINE_SOURCES = NO - -# Setting the STRIP_CODE_COMMENTS tag to YES will instruct doxygen to hide any -# special comment blocks from generated source code fragments. Normal C, C++ and -# Fortran comments will always remain visible. -# The default value is: YES. - -STRIP_CODE_COMMENTS = YES - -# If the REFERENCED_BY_RELATION tag is set to YES then for each documented -# function all documented functions referencing it will be listed. -# The default value is: NO. - -REFERENCED_BY_RELATION = NO - -# If the REFERENCES_RELATION tag is set to YES then for each documented function -# all documented entities called/used by that function will be listed. -# The default value is: NO. - -REFERENCES_RELATION = NO - -# If the REFERENCES_LINK_SOURCE tag is set to YES and SOURCE_BROWSER tag is set -# to YES then the hyperlinks from functions in REFERENCES_RELATION and -# REFERENCED_BY_RELATION lists will link to the source code. Otherwise they will -# link to the documentation. -# The default value is: YES. - -REFERENCES_LINK_SOURCE = YES - -# If SOURCE_TOOLTIPS is enabled (the default) then hovering a hyperlink in the -# source code will show a tooltip with additional information such as prototype, -# brief description and links to the definition and documentation. Since this -# will make the HTML file larger and loading of large files a bit slower, you -# can opt to disable this feature. -# The default value is: YES. -# This tag requires that the tag SOURCE_BROWSER is set to YES. - -SOURCE_TOOLTIPS = YES - -# If the USE_HTAGS tag is set to YES then the references to source code will -# point to the HTML generated by the htags(1) tool instead of doxygen built-in -# source browser. The htags tool is part of GNU's global source tagging system -# (see http://www.gnu.org/software/global/global.html). You will need version -# 4.8.6 or higher. -# -# To use it do the following: -# - Install the latest version of global -# - Enable SOURCE_BROWSER and USE_HTAGS in the config file -# - Make sure the INPUT points to the root of the source tree -# - Run doxygen as normal -# -# Doxygen will invoke htags (and that will in turn invoke gtags), so these -# tools must be available from the command line (i.e. in the search path). -# -# The result: instead of the source browser generated by doxygen, the links to -# source code will now point to the output of htags. -# The default value is: NO. -# This tag requires that the tag SOURCE_BROWSER is set to YES. - -USE_HTAGS = NO - -# If the VERBATIM_HEADERS tag is set the YES then doxygen will generate a -# verbatim copy of the header file for each class for which an include is -# specified. Set to NO to disable this. -# See also: Section \class. -# The default value is: YES. - -VERBATIM_HEADERS = YES - -#--------------------------------------------------------------------------- -# Configuration options related to the alphabetical class index -#--------------------------------------------------------------------------- - -# If the ALPHABETICAL_INDEX tag is set to YES, an alphabetical index of all -# compounds will be generated. Enable this if the project contains a lot of -# classes, structs, unions or interfaces. -# The default value is: YES. - -ALPHABETICAL_INDEX = YES - -# The COLS_IN_ALPHA_INDEX tag can be used to specify the number of columns in -# which the alphabetical index list will be split. -# Minimum value: 1, maximum value: 20, default value: 5. -# This tag requires that the tag ALPHABETICAL_INDEX is set to YES. 
- -COLS_IN_ALPHA_INDEX = 5 - -# In case all classes in a project start with a common prefix, all classes will -# be put under the same header in the alphabetical index. The IGNORE_PREFIX tag -# can be used to specify a prefix (or a list of prefixes) that should be ignored -# while generating the index headers. -# This tag requires that the tag ALPHABETICAL_INDEX is set to YES. - -IGNORE_PREFIX = - -#--------------------------------------------------------------------------- -# Configuration options related to the HTML output -#--------------------------------------------------------------------------- - -# If the GENERATE_HTML tag is set to YES, doxygen will generate HTML output -# The default value is: YES. - -GENERATE_HTML = YES - -# The HTML_OUTPUT tag is used to specify where the HTML docs will be put. If a -# relative path is entered the value of OUTPUT_DIRECTORY will be put in front of -# it. -# The default directory is: html. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_OUTPUT = html - -# The HTML_FILE_EXTENSION tag can be used to specify the file extension for each -# generated HTML page (for example: .htm, .php, .asp). -# The default value is: .html. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_FILE_EXTENSION = .html - -# The HTML_HEADER tag can be used to specify a user-defined HTML header file for -# each generated HTML page. If the tag is left blank doxygen will generate a -# standard header. -# -# To get valid HTML the header file that includes any scripts and style sheets -# that doxygen needs, which is dependent on the configuration options used (e.g. -# the setting GENERATE_TREEVIEW). It is highly recommended to start with a -# default header using -# doxygen -w html new_header.html new_footer.html new_stylesheet.css -# YourConfigFile -# and then modify the file new_header.html. See also section "Doxygen usage" -# for information on how to generate the default header that doxygen normally -# uses. -# Note: The header is subject to change so you typically have to regenerate the -# default header when upgrading to a newer version of doxygen. For a description -# of the possible markers and block names see the documentation. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_HEADER = - -# The HTML_FOOTER tag can be used to specify a user-defined HTML footer for each -# generated HTML page. If the tag is left blank doxygen will generate a standard -# footer. See HTML_HEADER for more information on how to generate a default -# footer and what special commands can be used inside the footer. See also -# section "Doxygen usage" for information on how to generate the default footer -# that doxygen normally uses. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_FOOTER = - -# The HTML_STYLESHEET tag can be used to specify a user-defined cascading style -# sheet that is used by each HTML page. It can be used to fine-tune the look of -# the HTML output. If left blank doxygen will generate a default style sheet. -# See also section "Doxygen usage" for information on how to generate the style -# sheet that doxygen normally uses. -# Note: It is recommended to use HTML_EXTRA_STYLESHEET instead of this tag, as -# it is more robust and this tag (HTML_STYLESHEET) will in the future become -# obsolete. -# This tag requires that the tag GENERATE_HTML is set to YES. 
- -HTML_STYLESHEET = - -# The HTML_EXTRA_STYLESHEET tag can be used to specify additional user-defined -# cascading style sheets that are included after the standard style sheets -# created by doxygen. Using this option one can overrule certain style aspects. -# This is preferred over using HTML_STYLESHEET since it does not replace the -# standard style sheet and is therefore more robust against future updates. -# Doxygen will copy the style sheet files to the output directory. -# Note: The order of the extra style sheet files is of importance (e.g. the last -# style sheet in the list overrules the setting of the previous ones in the -# list). For an example see the documentation. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_EXTRA_STYLESHEET = - -# The HTML_EXTRA_FILES tag can be used to specify one or more extra images or -# other source files which should be copied to the HTML output directory. Note -# that these files will be copied to the base HTML output directory. Use the -# $relpath^ marker in the HTML_HEADER and/or HTML_FOOTER files to load these -# files. In the HTML_STYLESHEET file, use the file name only. Also note that the -# files will be copied as-is; there are no commands or markers available. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_EXTRA_FILES = - -# The HTML_COLORSTYLE_HUE tag controls the color of the HTML output. Doxygen -# will adjust the colors in the style sheet and background images according to -# this color. Hue is specified as an angle on a colorwheel, see -# http://en.wikipedia.org/wiki/Hue for more information. For instance the value -# 0 represents red, 60 is yellow, 120 is green, 180 is cyan, 240 is blue, 300 -# purple, and 360 is red again. -# Minimum value: 0, maximum value: 359, default value: 220. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_COLORSTYLE_HUE = 220 - -# The HTML_COLORSTYLE_SAT tag controls the purity (or saturation) of the colors -# in the HTML output. For a value of 0 the output will use grayscales only. A -# value of 255 will produce the most vivid colors. -# Minimum value: 0, maximum value: 255, default value: 100. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_COLORSTYLE_SAT = 100 - -# The HTML_COLORSTYLE_GAMMA tag controls the gamma correction applied to the -# luminance component of the colors in the HTML output. Values below 100 -# gradually make the output lighter, whereas values above 100 make the output -# darker. The value divided by 100 is the actual gamma applied, so 80 represents -# a gamma of 0.8, The value 220 represents a gamma of 2.2, and 100 does not -# change the gamma. -# Minimum value: 40, maximum value: 240, default value: 80. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_COLORSTYLE_GAMMA = 80 - -# If the HTML_TIMESTAMP tag is set to YES then the footer of each generated HTML -# page will contain the date and time when the page was generated. Setting this -# to YES can help to show when doxygen was last run and thus if the -# documentation is up to date. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_TIMESTAMP = NO - -# If the HTML_DYNAMIC_SECTIONS tag is set to YES then the generated HTML -# documentation will contain sections that can be hidden and shown after the -# page has loaded. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. 
- -HTML_DYNAMIC_SECTIONS = NO - -# With HTML_INDEX_NUM_ENTRIES one can control the preferred number of entries -# shown in the various tree structured indices initially; the user can expand -# and collapse entries dynamically later on. Doxygen will expand the tree to -# such a level that at most the specified number of entries are visible (unless -# a fully collapsed tree already exceeds this amount). So setting the number of -# entries 1 will produce a full collapsed tree by default. 0 is a special value -# representing an infinite number of entries and will result in a full expanded -# tree by default. -# Minimum value: 0, maximum value: 9999, default value: 100. -# This tag requires that the tag GENERATE_HTML is set to YES. - -HTML_INDEX_NUM_ENTRIES = 100 - -# If the GENERATE_DOCSET tag is set to YES, additional index files will be -# generated that can be used as input for Apple's Xcode 3 integrated development -# environment (see: http://developer.apple.com/tools/xcode/), introduced with -# OSX 10.5 (Leopard). To create a documentation set, doxygen will generate a -# Makefile in the HTML output directory. Running make will produce the docset in -# that directory and running make install will install the docset in -# ~/Library/Developer/Shared/Documentation/DocSets so that Xcode will find it at -# startup. See http://developer.apple.com/tools/creatingdocsetswithdoxygen.html -# for more information. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -GENERATE_DOCSET = NO - -# This tag determines the name of the docset feed. A documentation feed provides -# an umbrella under which multiple documentation sets from a single provider -# (such as a company or product suite) can be grouped. -# The default value is: Doxygen generated docs. -# This tag requires that the tag GENERATE_DOCSET is set to YES. - -DOCSET_FEEDNAME = "Doxygen generated docs" - -# This tag specifies a string that should uniquely identify the documentation -# set bundle. This should be a reverse domain-name style string, e.g. -# com.mycompany.MyDocSet. Doxygen will append .docset to the name. -# The default value is: org.doxygen.Project. -# This tag requires that the tag GENERATE_DOCSET is set to YES. - -DOCSET_BUNDLE_ID = org.doxygen.Project - -# The DOCSET_PUBLISHER_ID tag specifies a string that should uniquely identify -# the documentation publisher. This should be a reverse domain-name style -# string, e.g. com.mycompany.MyDocSet.documentation. -# The default value is: org.doxygen.Publisher. -# This tag requires that the tag GENERATE_DOCSET is set to YES. - -DOCSET_PUBLISHER_ID = org.doxygen.Publisher - -# The DOCSET_PUBLISHER_NAME tag identifies the documentation publisher. -# The default value is: Publisher. -# This tag requires that the tag GENERATE_DOCSET is set to YES. - -DOCSET_PUBLISHER_NAME = Publisher - -# If the GENERATE_HTMLHELP tag is set to YES then doxygen generates three -# additional HTML index files: index.hhp, index.hhc, and index.hhk. The -# index.hhp is a project file that can be read by Microsoft's HTML Help Workshop -# (see: http://www.microsoft.com/en-us/download/details.aspx?id=21138) on -# Windows. -# -# The HTML Help Workshop contains a compiler that can convert all HTML output -# generated by doxygen into a single compiled HTML file (.chm). Compiled HTML -# files are now used as the Windows 98 help format, and will replace the old -# Windows help format (.hlp) on all Windows platforms in the future. 
Compressed -# HTML files also contain an index, a table of contents, and you can search for -# words in the documentation. The HTML workshop also contains a viewer for -# compressed HTML files. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -GENERATE_HTMLHELP = NO - -# The CHM_FILE tag can be used to specify the file name of the resulting .chm -# file. You can add a path in front of the file if the result should not be -# written to the html output directory. -# This tag requires that the tag GENERATE_HTMLHELP is set to YES. - -CHM_FILE = - -# The HHC_LOCATION tag can be used to specify the location (absolute path -# including file name) of the HTML help compiler (hhc.exe). If non-empty, -# doxygen will try to run the HTML help compiler on the generated index.hhp. -# The file has to be specified with full path. -# This tag requires that the tag GENERATE_HTMLHELP is set to YES. - -HHC_LOCATION = - -# The GENERATE_CHI flag controls if a separate .chi index file is generated -# (YES) or that it should be included in the master .chm file (NO). -# The default value is: NO. -# This tag requires that the tag GENERATE_HTMLHELP is set to YES. - -GENERATE_CHI = NO - -# The CHM_INDEX_ENCODING is used to encode HtmlHelp index (hhk), content (hhc) -# and project file content. -# This tag requires that the tag GENERATE_HTMLHELP is set to YES. - -CHM_INDEX_ENCODING = - -# The BINARY_TOC flag controls whether a binary table of contents is generated -# (YES) or a normal table of contents (NO) in the .chm file. Furthermore it -# enables the Previous and Next buttons. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTMLHELP is set to YES. - -BINARY_TOC = NO - -# The TOC_EXPAND flag can be set to YES to add extra items for group members to -# the table of contents of the HTML help documentation and to the tree view. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTMLHELP is set to YES. - -TOC_EXPAND = NO - -# If the GENERATE_QHP tag is set to YES and both QHP_NAMESPACE and -# QHP_VIRTUAL_FOLDER are set, an additional index file will be generated that -# can be used as input for Qt's qhelpgenerator to generate a Qt Compressed Help -# (.qch) of the generated HTML documentation. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -GENERATE_QHP = NO - -# If the QHG_LOCATION tag is specified, the QCH_FILE tag can be used to specify -# the file name of the resulting .qch file. The path specified is relative to -# the HTML output folder. -# This tag requires that the tag GENERATE_QHP is set to YES. - -QCH_FILE = - -# The QHP_NAMESPACE tag specifies the namespace to use when generating Qt Help -# Project output. For more information please see Qt Help Project / Namespace -# (see: http://qt-project.org/doc/qt-4.8/qthelpproject.html#namespace). -# The default value is: org.doxygen.Project. -# This tag requires that the tag GENERATE_QHP is set to YES. - -QHP_NAMESPACE = org.doxygen.Project - -# The QHP_VIRTUAL_FOLDER tag specifies the namespace to use when generating Qt -# Help Project output. For more information please see Qt Help Project / Virtual -# Folders (see: http://qt-project.org/doc/qt-4.8/qthelpproject.html#virtual- -# folders). -# The default value is: doc. -# This tag requires that the tag GENERATE_QHP is set to YES. - -QHP_VIRTUAL_FOLDER = doc - -# If the QHP_CUST_FILTER_NAME tag is set, it specifies the name of a custom -# filter to add. 
For more information please see Qt Help Project / Custom -# Filters (see: http://qt-project.org/doc/qt-4.8/qthelpproject.html#custom- -# filters). -# This tag requires that the tag GENERATE_QHP is set to YES. - -QHP_CUST_FILTER_NAME = - -# The QHP_CUST_FILTER_ATTRS tag specifies the list of the attributes of the -# custom filter to add. For more information please see Qt Help Project / Custom -# Filters (see: http://qt-project.org/doc/qt-4.8/qthelpproject.html#custom- -# filters). -# This tag requires that the tag GENERATE_QHP is set to YES. - -QHP_CUST_FILTER_ATTRS = - -# The QHP_SECT_FILTER_ATTRS tag specifies the list of the attributes this -# project's filter section matches. Qt Help Project / Filter Attributes (see: -# http://qt-project.org/doc/qt-4.8/qthelpproject.html#filter-attributes). -# This tag requires that the tag GENERATE_QHP is set to YES. - -QHP_SECT_FILTER_ATTRS = - -# The QHG_LOCATION tag can be used to specify the location of Qt's -# qhelpgenerator. If non-empty doxygen will try to run qhelpgenerator on the -# generated .qhp file. -# This tag requires that the tag GENERATE_QHP is set to YES. - -QHG_LOCATION = - -# If the GENERATE_ECLIPSEHELP tag is set to YES, additional index files will be -# generated, together with the HTML files, they form an Eclipse help plugin. To -# install this plugin and make it available under the help contents menu in -# Eclipse, the contents of the directory containing the HTML and XML files needs -# to be copied into the plugins directory of eclipse. The name of the directory -# within the plugins directory should be the same as the ECLIPSE_DOC_ID value. -# After copying Eclipse needs to be restarted before the help appears. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -GENERATE_ECLIPSEHELP = NO - -# A unique identifier for the Eclipse help plugin. When installing the plugin -# the directory name containing the HTML and XML files should also have this -# name. Each documentation set should have its own identifier. -# The default value is: org.doxygen.Project. -# This tag requires that the tag GENERATE_ECLIPSEHELP is set to YES. - -ECLIPSE_DOC_ID = org.doxygen.Project - -# If you want full control over the layout of the generated HTML pages it might -# be necessary to disable the index and replace it with your own. The -# DISABLE_INDEX tag can be used to turn on/off the condensed index (tabs) at top -# of each HTML page. A value of NO enables the index and the value YES disables -# it. Since the tabs in the index contain the same information as the navigation -# tree, you can set this option to YES if you also set GENERATE_TREEVIEW to YES. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -DISABLE_INDEX = NO - -# The GENERATE_TREEVIEW tag is used to specify whether a tree-like index -# structure should be generated to display hierarchical information. If the tag -# value is set to YES, a side panel will be generated containing a tree-like -# index structure (just like the one that is generated for HTML Help). For this -# to work a browser that supports JavaScript, DHTML, CSS and frames is required -# (i.e. any modern browser). Windows users are probably better off using the -# HTML help feature. Via custom style sheets (see HTML_EXTRA_STYLESHEET) one can -# further fine-tune the look of the index. 
As an example, the default style -# sheet generated by doxygen has an example that shows how to put an image at -# the root of the tree instead of the PROJECT_NAME. Since the tree basically has -# the same information as the tab index, you could consider setting -# DISABLE_INDEX to YES when enabling this option. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -GENERATE_TREEVIEW = NO - -# The ENUM_VALUES_PER_LINE tag can be used to set the number of enum values that -# doxygen will group on one line in the generated HTML documentation. -# -# Note that a value of 0 will completely suppress the enum values from appearing -# in the overview section. -# Minimum value: 0, maximum value: 20, default value: 4. -# This tag requires that the tag GENERATE_HTML is set to YES. - -ENUM_VALUES_PER_LINE = 4 - -# If the treeview is enabled (see GENERATE_TREEVIEW) then this tag can be used -# to set the initial width (in pixels) of the frame in which the tree is shown. -# Minimum value: 0, maximum value: 1500, default value: 250. -# This tag requires that the tag GENERATE_HTML is set to YES. - -TREEVIEW_WIDTH = 250 - -# If the EXT_LINKS_IN_WINDOW option is set to YES, doxygen will open links to -# external symbols imported via tag files in a separate window. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -EXT_LINKS_IN_WINDOW = NO - -# Use this tag to change the font size of LaTeX formulas included as images in -# the HTML documentation. When you change the font size after a successful -# doxygen run you need to manually remove any form_*.png images from the HTML -# output directory to force them to be regenerated. -# Minimum value: 8, maximum value: 50, default value: 10. -# This tag requires that the tag GENERATE_HTML is set to YES. - -FORMULA_FONTSIZE = 10 - -# Use the FORMULA_TRANPARENT tag to determine whether or not the images -# generated for formulas are transparent PNGs. Transparent PNGs are not -# supported properly for IE 6.0, but are supported on all modern browsers. -# -# Note that when changing this option you need to delete any form_*.png files in -# the HTML output directory before the changes have effect. -# The default value is: YES. -# This tag requires that the tag GENERATE_HTML is set to YES. - -FORMULA_TRANSPARENT = YES - -# Enable the USE_MATHJAX option to render LaTeX formulas using MathJax (see -# http://www.mathjax.org) which uses client side Javascript for the rendering -# instead of using pre-rendered bitmaps. Use this if you do not have LaTeX -# installed or if you want to formulas look prettier in the HTML output. When -# enabled you may also need to install MathJax separately and configure the path -# to it using the MATHJAX_RELPATH option. -# The default value is: NO. -# This tag requires that the tag GENERATE_HTML is set to YES. - -USE_MATHJAX = NO - -# When MathJax is enabled you can set the default output format to be used for -# the MathJax output. See the MathJax site (see: -# http://docs.mathjax.org/en/latest/output.html) for more details. -# Possible values are: HTML-CSS (which is slower, but has the best -# compatibility), NativeMML (i.e. MathML) and SVG. -# The default value is: HTML-CSS. -# This tag requires that the tag USE_MATHJAX is set to YES. - -MATHJAX_FORMAT = HTML-CSS - -# When MathJax is enabled you need to specify the location relative to the HTML -# output directory using the MATHJAX_RELPATH option. The destination directory -# should contain the MathJax.js script. 
For instance, if the mathjax directory -# is located at the same level as the HTML output directory, then -# MATHJAX_RELPATH should be ../mathjax. The default value points to the MathJax -# Content Delivery Network so you can quickly see the result without installing -# MathJax. However, it is strongly recommended to install a local copy of -# MathJax from http://www.mathjax.org before deployment. -# The default value is: http://cdn.mathjax.org/mathjax/latest. -# This tag requires that the tag USE_MATHJAX is set to YES. - -MATHJAX_RELPATH = http://cdn.mathjax.org/mathjax/latest - -# The MATHJAX_EXTENSIONS tag can be used to specify one or more MathJax -# extension names that should be enabled during MathJax rendering. For example -# MATHJAX_EXTENSIONS = TeX/AMSmath TeX/AMSsymbols -# This tag requires that the tag USE_MATHJAX is set to YES. - -MATHJAX_EXTENSIONS = - -# The MATHJAX_CODEFILE tag can be used to specify a file with javascript pieces -# of code that will be used on startup of the MathJax code. See the MathJax site -# (see: http://docs.mathjax.org/en/latest/output.html) for more details. For an -# example see the documentation. -# This tag requires that the tag USE_MATHJAX is set to YES. - -MATHJAX_CODEFILE = - -# When the SEARCHENGINE tag is enabled doxygen will generate a search box for -# the HTML output. The underlying search engine uses javascript and DHTML and -# should work on any modern browser. Note that when using HTML help -# (GENERATE_HTMLHELP), Qt help (GENERATE_QHP), or docsets (GENERATE_DOCSET) -# there is already a search function so this one should typically be disabled. -# For large projects the javascript based search engine can be slow, then -# enabling SERVER_BASED_SEARCH may provide a better solution. It is possible to -# search using the keyboard; to jump to the search box use <access key> + S -# (what the <access key> is depends on the OS and browser, but it is typically -# <CTRL>, <ALT>/