diff --git a/doc/source/ray-air/examples/BUILD b/doc/source/ray-air/examples/BUILD
index 37895a1d851f..1beb742e708b 100644
--- a/doc/source/ray-air/examples/BUILD
+++ b/doc/source/ray-air/examples/BUILD
@@ -31,9 +31,7 @@ py_test_run_all_notebooks(
     include = ["*.ipynb"],
     exclude = [
         "huggingface_text_classification.ipynb",
-        "torch_incremental_learning.ipynb",
         "feast_example.ipynb",  # REGRESSION
-        "tfx_tabular_train_to_serve.ipynb", # REGRESSION
     ],
     data = ["//doc/source/ray-air/examples:air_examples"],
     tags = ["exclusive", "team:ml", "ray_air"],
diff --git a/doc/source/ray-air/examples/tfx_tabular_train_to_serve.ipynb b/doc/source/ray-air/examples/tfx_tabular_train_to_serve.ipynb
index 78b43111b761..ece0a92d89cc 100644
--- a/doc/source/ray-air/examples/tfx_tabular_train_to_serve.ipynb
+++ b/doc/source/ray-air/examples/tfx_tabular_train_to_serve.ipynb
@@ -31,7 +31,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -65,7 +65,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -73,7 +73,68 @@
     "id": "MOsHUjgdIrIW",
     "outputId": "8a21ead5-bb2d-4a3d-ae41-17a313688b24"
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "2022-07-20 18:45:28,814\tINFO services.py:1483 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8266\u001b[39m\u001b[22m\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "    <div style=\"margin-left: 50px;display: flex;flex-direction: row;align-items: center\">\n",
+       "        <h3 style=\"color: var(--jp-ui-font-color0)\">Ray</h3>\n",
+       "        <svg version=\"1.1\" id=\"ray\" width=\"3em\" viewBox=\"0 0 144.5 144.6\" style=\"margin-left: 3em;margin-right: 3em\">\n",
+       "            <g id=\"layer-1\">\n",
+       "                <path fill=\"#00a2e9\" class=\"st0\" d=\"M97.3,77.2c-3.8-1.1-6.2,0.9-8.3,5.1c-3.5,6.8-9.9,9.9-17.4,9.6S58,88.1,54.8,81.2c-1.4-3-3-4-6.3-4.1\n",
+       "                    c-5.6-0.1-9.9,0.1-13.1,6.4c-3.8,7.6-13.6,10.2-21.8,7.6C5.2,88.4-0.4,80.5,0,71.7c0.1-8.4,5.7-15.8,13.8-18.2\n",
+       "                    c8.4-2.6,17.5,0.7,22.3,8c1.3,1.9,1.3,5.2,3.6,5.6c3.9,0.6,8,0.2,12,0.2c1.8,0,1.9-1.6,2.4-2.8c3.5-7.8,9.7-11.8,18-11.9\n",
+       "                    c8.2-0.1,14.4,3.9,17.8,11.4c1.3,2.8,2.9,3.6,5.7,3.3c1-0.1,2,0.1,3,0c2.8-0.5,6.4,1.7,8.1-2.7s-2.3-5.5-4.1-7.5\n",
+       "                    c-5.1-5.7-10.9-10.8-16.1-16.3C84,38,81.9,37.1,78,38.3C66.7,42,56.2,35.7,53,24.1C50.3,14,57.3,2.8,67.7,0.5\n",
+       "                    C78.4-2,89,4.7,91.5,15.3c0.1,0.3,0.1,0.5,0.2,0.8c0.7,3.4,0.7,6.9-0.8,9.8c-1.7,3.2-0.8,5,1.5,7.2c6.7,6.5,13.3,13,19.8,19.7\n",
+       "                    c1.8,1.8,3,2.1,5.5,1.2c9.1-3.4,17.9-0.6,23.4,7c4.8,6.9,4.6,16.1-0.4,22.9c-5.4,7.2-14.2,9.9-23.1,6.5c-2.3-0.9-3.5-0.6-5.1,1.1\n",
+       "                    c-6.7,6.9-13.6,13.7-20.5,20.4c-1.8,1.8-2.5,3.2-1.4,5.9c3.5,8.7,0.3,18.6-7.7,23.6c-7.9,5-18.2,3.8-24.8-2.9\n",
+       "                    c-6.4-6.4-7.4-16.2-2.5-24.3c4.9-7.8,14.5-11,23.1-7.8c3,1.1,4.7,0.5,6.9-1.7C91.7,98.4,98,92.3,104.2,86c1.6-1.6,4.1-2.7,2.6-6.2\n",
+       "                    c-1.4-3.3-3.8-2.5-6.2-2.6C99.8,77.2,98.9,77.2,97.3,77.2z M72.1,29.7c5.5,0.1,9.9-4.3,10-9.8c0-0.1,0-0.2,0-0.3\n",
+       "                    C81.8,14,77,9.8,71.5,10.2c-5,0.3-9,4.2-9.3,9.2c-0.2,5.5,4,10.1,9.5,10.3C71.8,29.7,72,29.7,72.1,29.7z M72.3,62.3\n",
+       "                    c-5.4-0.1-9.9,4.2-10.1,9.7c0,0.2,0,0.3,0,0.5c0.2,5.4,4.5,9.7,9.9,10c5.1,0.1,9.9-4.7,10.1-9.8c0.2-5.5-4-10-9.5-10.3\n",
+       "                    C72.6,62.3,72.4,62.3,72.3,62.3z M115,72.5c0.1,5.4,4.5,9.7,9.8,9.9c5.6-0.2,10-4.8,10-10.4c-0.2-5.4-4.6-9.7-10-9.7\n",
+       "                    c-5.3-0.1-9.8,4.2-9.9,9.5C115,72.1,115,72.3,115,72.5z M19.5,62.3c-5.4,0.1-9.8,4.4-10,9.8c-0.1,5.1,5.2,10.4,10.2,10.3\n",
+       "                    c5.6-0.2,10-4.9,9.8-10.5c-0.1-5.4-4.5-9.7-9.9-9.6C19.6,62.3,19.5,62.3,19.5,62.3z M71.8,134.6c5.9,0.2,10.3-3.9,10.4-9.6\n",
+       "                    c0.5-5.5-3.6-10.4-9.1-10.8c-5.5-0.5-10.4,3.6-10.8,9.1c0,0.5,0,0.9,0,1.4c-0.2,5.3,4,9.8,9.3,10\n",
+       "                    C71.6,134.6,71.7,134.6,71.8,134.6z\"/>\n",
+       "            </g>\n",
+       "        </svg>\n",
+       "        <table>\n",
+       "            <tr>\n",
+       "                <td style=\"text-align: left\"><b>Python version:</b></td>\n",
+       "                <td style=\"text-align: left\"><b>3.7.10</b></td>\n",
+       "            </tr>\n",
+       "            <tr>\n",
+       "                <td style=\"text-align: left\"><b>Ray version:</b></td>\n",
+       "                <td style=\"text-align: left\"><b> 3.0.0.dev0</b></td>\n",
+       "            </tr>\n",
+       "            <tr>\n",
+       "    <td style=\"text-align: left\"><b>Dashboard:</b></td>\n",
+       "    <td style=\"text-align: left\"><b><a href=\"http://127.0.0.1:8266\" target=\"_blank\">http://127.0.0.1:8266</a></b></td>\n",
+       "</tr>\n",
+       "\n",
+       "        </table>\n",
+       "    </div>\n",
+       "</div>\n"
+      ],
+      "text/plain": [
+       "RayContext(dashboard_url='127.0.0.1:8266', python_version='3.7.10', ray_version='3.0.0.dev0', ray_commit='{{RAY_COMMIT_SHA}}', address_info={'node_ip_address': '127.0.0.1', 'raylet_ip_address': '127.0.0.1', 'redis_address': None, 'object_store_address': '/tmp/ray/session_2022-07-20_18-45-26_127581_21006/sockets/plasma_store', 'raylet_socket_name': '/tmp/ray/session_2022-07-20_18-45-26_127581_21006/sockets/raylet', 'webui_url': '127.0.0.1:8266', 'session_dir': '/tmp/ray/session_2022-07-20_18-45-26_127581_21006', 'metrics_export_port': 63884, 'gcs_address': '127.0.0.1:63685', 'address': '127.0.0.1:63685', 'dashboard_agent_listen_port': 52365, 'node_id': 'c21f810137e56bd967ab3f246c66aadc5262e00bdbe19c34c23456e7'})"
+      ]
+     },
+     "execution_count": 2,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
    "source": [
     "from pprint import pprint\n",
     "import ray\n",
@@ -93,7 +154,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -101,7 +162,18 @@
     "id": "KlMz0dt9hYbS",
     "outputId": "e7234b52-08b4-49fc-e14c-72f283b893f2"
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "{'CPU': 16.0,\n",
+      " 'memory': 30436675994.0,\n",
+      " 'node:127.0.0.1': 1.0,\n",
+      " 'object_store_memory': 2147483648.0}\n"
+     ]
+    }
+   ],
    "source": [
     "pprint(ray.cluster_resources())"
    ]
@@ -126,7 +198,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "metadata": {
     "id": "gAbhv9OqhYbT"
    },
@@ -160,7 +232,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "metadata": {
     "id": "FbeYf1aF8ISK"
    },
@@ -180,7 +252,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/",
@@ -189,7 +261,157 @@
     "id": "8tugpr5S8gPq",
     "outputId": "3c57a348-12a7-4b6c-f9b2-fabdcb7a7c88"
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>pickup_community_area</th>\n",
+       "      <th>trip_start_month</th>\n",
+       "      <th>trip_start_hour</th>\n",
+       "      <th>trip_start_day</th>\n",
+       "      <th>trip_start_timestamp</th>\n",
+       "      <th>trip_miles</th>\n",
+       "      <th>dropoff_census_tract</th>\n",
+       "      <th>payment_type</th>\n",
+       "      <th>company</th>\n",
+       "      <th>trip_seconds</th>\n",
+       "      <th>dropoff_community_area</th>\n",
+       "      <th>is_big_tip</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>5</td>\n",
+       "      <td>19</td>\n",
+       "      <td>6</td>\n",
+       "      <td>1400269500</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>Credit Card</td>\n",
+       "      <td>Chicago Elite Cab Corp. (Chicago Carriag</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>False</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>3</td>\n",
+       "      <td>19</td>\n",
+       "      <td>5</td>\n",
+       "      <td>1362683700</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>Unknown</td>\n",
+       "      <td>Chicago Elite Cab Corp.</td>\n",
+       "      <td>300.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>False</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>60.0</td>\n",
+       "      <td>10</td>\n",
+       "      <td>2</td>\n",
+       "      <td>3</td>\n",
+       "      <td>1380593700</td>\n",
+       "      <td>12.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>Cash</td>\n",
+       "      <td>Taxi Affiliation Services</td>\n",
+       "      <td>1380.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>False</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>10.0</td>\n",
+       "      <td>10</td>\n",
+       "      <td>1</td>\n",
+       "      <td>2</td>\n",
+       "      <td>1382319000</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>Cash</td>\n",
+       "      <td>Taxi Affiliation Services</td>\n",
+       "      <td>180.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>False</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>14.0</td>\n",
+       "      <td>5</td>\n",
+       "      <td>7</td>\n",
+       "      <td>5</td>\n",
+       "      <td>1369897200</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>Cash</td>\n",
+       "      <td>Dispatch Taxi Affiliation</td>\n",
+       "      <td>1080.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>False</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   pickup_community_area  trip_start_month  trip_start_hour  trip_start_day  \\\n",
+       "0                    NaN                 5               19               6   \n",
+       "1                    NaN                 3               19               5   \n",
+       "2                   60.0                10                2               3   \n",
+       "3                   10.0                10                1               2   \n",
+       "4                   14.0                 5                7               5   \n",
+       "\n",
+       "   trip_start_timestamp  trip_miles  dropoff_census_tract payment_type  \\\n",
+       "0            1400269500         0.0                   NaN  Credit Card   \n",
+       "1            1362683700         0.0                   NaN      Unknown   \n",
+       "2            1380593700        12.6                   NaN         Cash   \n",
+       "3            1382319000         0.0                   NaN         Cash   \n",
+       "4            1369897200         0.0                   NaN         Cash   \n",
+       "\n",
+       "                                    company  trip_seconds  \\\n",
+       "0  Chicago Elite Cab Corp. (Chicago Carriag           0.0   \n",
+       "1                   Chicago Elite Cab Corp.         300.0   \n",
+       "2                 Taxi Affiliation Services        1380.0   \n",
+       "3                 Taxi Affiliation Services         180.0   \n",
+       "4                 Dispatch Taxi Affiliation        1080.0   \n",
+       "\n",
+       "   dropoff_community_area  is_big_tip  \n",
+       "0                     NaN       False  \n",
+       "1                     NaN       False  \n",
+       "2                     NaN       False  \n",
+       "3                     NaN       False  \n",
+       "4                     NaN       False  "
+      ]
+     },
+     "execution_count": 6,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
    "source": [
     "data.head(5)"
    ]
@@ -206,7 +428,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 7,
    "metadata": {
     "id": "YSLvrBMC9aRv"
    },
@@ -239,7 +461,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 8,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -247,7 +469,15 @@
     "id": "xfhRl7eO981w",
     "outputId": "f80d90ff-fc8a-4a7d-b544-31633823d596"
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "There are 11251 samples for training and 3751 samples for testing.\n"
+     ]
+    }
+   ],
    "source": [
     "print(f\"There are {train_ds.count()} samples for training and {test_df.shape[0]} samples for testing.\")"
    ]
@@ -286,7 +516,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 9,
    "metadata": {
     "id": "zVvslsfMIrIh"
    },
@@ -345,7 +575,8 @@
     "        result = {}\n",
     "        feature_cols = [col for col in dataframe.columns if col != LABEL]\n",
     "        result[\"input\"] = TensorArray(dataframe[feature_cols].to_numpy(dtype=np.float32))\n",
-    "        result[LABEL] = dataframe[LABEL]\n",
+    "        if LABEL in dataframe.columns:\n",
+    "            result[LABEL] = dataframe[LABEL]\n",
     "        return  pd.DataFrame(result)\n",
     "\n",
     "    chained_pp = Chain(\n",
@@ -372,7 +603,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 10,
    "metadata": {
     "id": "ejGVU-uN_dVP"
    },
@@ -414,7 +645,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 11,
    "metadata": {
     "id": "MwhAeEOuhYbV"
    },
@@ -557,7 +788,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 14,
    "metadata": {
     "id": "BBbcMwc9Rz66"
    },
@@ -582,7 +813,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 15,
    "metadata": {
     "id": "ujmwT8ZhScq1"
    },
@@ -608,7 +839,7 @@
     "        # This is due to a current limitation on Serve that's\n",
     "        # being addressed.\n",
     "        # TODO(xwjiang): Change to True.\n",
-    "        batching_params=False,\n",
+    "        batching_params=dict(max_batch_size=2, batch_wait_timeout_s=5),\n",
     "        model_definition=model_definition,\n",
     "        http_adapter=adapter,\n",
     "    )\n",
@@ -617,12 +848,27 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 16,
    "metadata": {
     "id": "uRe9a8947pl9"
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "2022-07-20 18:46:11,759\tINFO services.py:1483 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8266\u001b[39m\u001b[22m\n",
+      "\u001b[2m\u001b[36m(ServeController pid=21308)\u001b[0m INFO 2022-07-20 18:46:15,348 controller 21308 checkpoint_path.py:17 - Using RayInternalKVStore for controller checkpoint and recovery.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=21308)\u001b[0m INFO 2022-07-20 18:46:15,350 controller 21308 http_state.py:126 - Starting HTTP proxy with name 'SERVE_CONTROLLER_ACTOR:SERVE_PROXY_ACTOR-58fb3ee046cdce5c602369291de78f60c65dcbd7c5c5a8af57ec3a26' on node '58fb3ee046cdce5c602369291de78f60c65dcbd7c5c5a8af57ec3a26' listening on '127.0.0.1:8000'\n",
+      "\u001b[2m\u001b[36m(HTTPProxyActor pid=21311)\u001b[0m INFO:     Started server process [21311]\n",
+      "/Users/jiaodong/anaconda3/envs/ray3.7/lib/python3.7/site-packages/ipykernel_launcher.py:23: UserWarning: From /var/folders/1s/wy6f3ytn3q726p5hl8fw8d780000gn/T/ipykernel_21006/609683685.py:23: deploy (from ray.serve.deployment) is deprecated and will be removed in a future version Please see https://docs.ray.io/en/latest/serve/index.html\n",
+      "\u001b[2m\u001b[36m(ServeController pid=21308)\u001b[0m INFO 2022-07-20 18:46:17,658 controller 21308 deployment_state.py:1281 - Adding 1 replicas to deployment 'Model'.\n",
+      "\u001b[2m\u001b[36m(ServeReplica:Model pid=21314)\u001b[0m 2022-07-20 18:46:23,199\tWARNING compression.py:18 -- lz4 not available, disabling sample compression. This will significantly impact RLlib performance. To install lz4, run `pip install lz4`.\n"
+     ]
+    }
+   ],
    "source": [
+    "import ray\n",
     "# Generally speaking, training and serving are done in totally different ray clusters.\n",
     "# To simulate that, let's shutdown the old ray cluster in preparation for serving.\n",
     "ray.shutdown()\n",
@@ -641,33 +887,106 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 19,
    "metadata": {
     "id": "E9m80HDmSz66"
    },
    "outputs": [],
    "source": [
     "import requests\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
     "\n",
-    "NUM_SERVE_REQUESTS = 100\n",
+    "NUM_SERVE_REQUESTS = 10\n",
     "\n",
     "def send_requests(df: pd.DataFrame, label: np.array):\n",
     "    for i in range(NUM_SERVE_REQUESTS):\n",
     "        one_row = df.iloc[[i]].to_dict()\n",
     "        serve_result = requests.post(endpoint_uri, json=one_row).json()\n",
     "        print(\n",
-    "            f\"request[{i}] prediction: {serve_result['predictions']['0']} \"\n",
+    "            f\"request{i} prediction: {serve_result[0]['predictions']} \"\n",
     "            f\"- label: {str(label[i])}\"\n",
     "        )"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 20,
    "metadata": {
     "id": "GFPwKc5JTgnI"
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request0 prediction: 0.004963837098330259 - label: True\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request1 prediction: 6.652726733591408e-05 - label: False\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request2 prediction: 0.00018405025184620172 - label: False\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request3 prediction: 0.00016512417641934007 - label: False\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request4 prediction: 0.00015515758423134685 - label: False\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request5 prediction: 5.948602483840659e-05 - label: False\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request6 prediction: 9.51739348238334e-05 - label: False\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request7 prediction: 3.4787988170137396e-06 - label: False\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request8 prediction: 0.00010751552326837555 - label: False\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "request9 prediction: 0.060329731553792953 - label: True\n"
+     ]
+    }
+   ],
    "source": [
     "send_requests(test_df, test_label)"
    ]
@@ -682,11 +1001,8 @@
    "name": "tfx (1) (1) (1).ipynb",
    "provenance": []
   },
-  "interpreter": {
-   "hash": "3c0d54d489a08ae47a06eae2fd00ff032d6cddb527c382959b7b2575f6a8167f"
-  },
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "Python 3.7.10 ('ray3.7')",
    "language": "python",
    "name": "python3"
   },
@@ -700,7 +1016,12 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.8.6"
+   "version": "3.7.10"
+  },
+  "vscode": {
+   "interpreter": {
+    "hash": "99d89bfe98f3aa2d7facda0d08d31ff2a0af9559e5330d719288ce64a1966273"
+   }
   }
  },
  "nbformat": 4,
diff --git a/doc/source/ray-air/examples/torch_incremental_learning.ipynb b/doc/source/ray-air/examples/torch_incremental_learning.ipynb
index b7fb2c72aa27..6dc76215bfaf 100644
--- a/doc/source/ray-air/examples/torch_incremental_learning.ipynb
+++ b/doc/source/ray-air/examples/torch_incremental_learning.ipynb
@@ -75,133 +75,7 @@
     "id": "kWr6BRMk1Y1j",
     "outputId": "dad49a31-a602-4e44-b5fe-932de603925e"
    },
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
-      "Requirement already satisfied: ray[data,serve,tune] in /usr/local/lib/python3.7/dist-packages (2.0.0.dev0)\n",
-      "Requirement already satisfied: numpy>=1.16 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (1.21.6)\n",
-      "Requirement already satisfied: filelock in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (3.7.0)\n",
-      "Requirement already satisfied: grpcio!=1.44.0,>=1.28.1 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (1.43.0)\n",
-      "Requirement already satisfied: msgpack<2.0.0,>=1.0.0 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (1.0.3)\n",
-      "Requirement already satisfied: protobuf>=3.15.3 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (3.17.3)\n",
-      "Requirement already satisfied: aiosignal in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (1.2.0)\n",
-      "Requirement already satisfied: frozenlist in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (1.3.0)\n",
-      "Requirement already satisfied: virtualenv in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (20.14.1)\n",
-      "Requirement already satisfied: pyyaml in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (3.13)\n",
-      "Requirement already satisfied: attrs in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (21.4.0)\n",
-      "Requirement already satisfied: click<=8.0.4,>=7.0 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (7.1.2)\n",
-      "Requirement already satisfied: requests in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (2.23.0)\n",
-      "Requirement already satisfied: jsonschema in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (4.3.3)\n",
-      "Requirement already satisfied: pyarrow<7.0.0,>=6.0.1 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (6.0.1)\n",
-      "Requirement already satisfied: fsspec in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (2022.5.0)\n",
-      "Requirement already satisfied: pandas in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (1.3.5)\n",
-      "Requirement already satisfied: tensorboardX>=1.9 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (2.5)\n",
-      "Requirement already satisfied: tabulate in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.8.9)\n",
-      "Requirement already satisfied: aiorwlock in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (1.3.0)\n",
-      "Requirement already satisfied: starlette in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.19.1)\n",
-      "Requirement already satisfied: prometheus-client<0.14.0,>=0.7.1 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.13.1)\n",
-      "Requirement already satisfied: py-spy>=0.2.0 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.3.12)\n",
-      "Requirement already satisfied: smart-open in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (6.0.0)\n",
-      "Requirement already satisfied: gpustat>=1.0.0b1 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (1.0.0b1)\n",
-      "Requirement already satisfied: colorful in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.5.4)\n",
-      "Requirement already satisfied: aiohttp>=3.7 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (3.8.1)\n",
-      "Requirement already satisfied: fastapi in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.78.0)\n",
-      "Requirement already satisfied: aiohttp-cors in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.7.0)\n",
-      "Requirement already satisfied: uvicorn==0.16.0 in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.16.0)\n",
-      "Requirement already satisfied: opencensus in /usr/local/lib/python3.7/dist-packages (from ray[data,serve,tune]) (0.9.0)\n",
-      "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.7/dist-packages (from uvicorn==0.16.0->ray[data,serve,tune]) (4.2.0)\n",
-      "Requirement already satisfied: asgiref>=3.4.0 in /usr/local/lib/python3.7/dist-packages (from uvicorn==0.16.0->ray[data,serve,tune]) (3.5.2)\n",
-      "Requirement already satisfied: h11>=0.8 in /usr/local/lib/python3.7/dist-packages (from uvicorn==0.16.0->ray[data,serve,tune]) (0.13.0)\n",
-      "Requirement already satisfied: asynctest==0.13.0 in /usr/local/lib/python3.7/dist-packages (from aiohttp>=3.7->ray[data,serve,tune]) (0.13.0)\n",
-      "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in /usr/local/lib/python3.7/dist-packages (from aiohttp>=3.7->ray[data,serve,tune]) (2.0.12)\n",
-      "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.7/dist-packages (from aiohttp>=3.7->ray[data,serve,tune]) (6.0.2)\n",
-      "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.7/dist-packages (from aiohttp>=3.7->ray[data,serve,tune]) (4.0.2)\n",
-      "Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.7/dist-packages (from aiohttp>=3.7->ray[data,serve,tune]) (1.7.2)\n",
-      "Requirement already satisfied: psutil in /usr/local/lib/python3.7/dist-packages (from gpustat>=1.0.0b1->ray[data,serve,tune]) (5.4.8)\n",
-      "Requirement already satisfied: six>=1.7 in /usr/local/lib/python3.7/dist-packages (from gpustat>=1.0.0b1->ray[data,serve,tune]) (1.15.0)\n",
-      "Requirement already satisfied: blessed>=1.17.1 in /usr/local/lib/python3.7/dist-packages (from gpustat>=1.0.0b1->ray[data,serve,tune]) (1.19.1)\n",
-      "Requirement already satisfied: nvidia-ml-py3>=7.352.0 in /usr/local/lib/python3.7/dist-packages (from gpustat>=1.0.0b1->ray[data,serve,tune]) (7.352.0)\n",
-      "Requirement already satisfied: wcwidth>=0.1.4 in /usr/local/lib/python3.7/dist-packages (from blessed>=1.17.1->gpustat>=1.0.0b1->ray[data,serve,tune]) (0.2.5)\n",
-      "Requirement already satisfied: idna>=2.0 in /usr/local/lib/python3.7/dist-packages (from yarl<2.0,>=1.0->aiohttp>=3.7->ray[data,serve,tune]) (2.10)\n",
-      "Requirement already satisfied: pydantic!=1.7,!=1.7.1,!=1.7.2,!=1.7.3,!=1.8,!=1.8.1,<2.0.0,>=1.6.2 in /usr/local/lib/python3.7/dist-packages (from fastapi->ray[data,serve,tune]) (1.9.1)\n",
-      "Requirement already satisfied: anyio<5,>=3.4.0 in /usr/local/lib/python3.7/dist-packages (from starlette->ray[data,serve,tune]) (3.6.1)\n",
-      "Requirement already satisfied: sniffio>=1.1 in /usr/local/lib/python3.7/dist-packages (from anyio<5,>=3.4.0->starlette->ray[data,serve,tune]) (1.2.0)\n",
-      "Requirement already satisfied: importlib-resources>=1.4.0 in /usr/local/lib/python3.7/dist-packages (from jsonschema->ray[data,serve,tune]) (5.7.1)\n",
-      "Requirement already satisfied: pyrsistent!=0.17.0,!=0.17.1,!=0.17.2,>=0.14.0 in /usr/local/lib/python3.7/dist-packages (from jsonschema->ray[data,serve,tune]) (0.18.1)\n",
-      "Requirement already satisfied: importlib-metadata in /usr/local/lib/python3.7/dist-packages (from jsonschema->ray[data,serve,tune]) (4.11.3)\n",
-      "Requirement already satisfied: zipp>=3.1.0 in /usr/local/lib/python3.7/dist-packages (from importlib-resources>=1.4.0->jsonschema->ray[data,serve,tune]) (3.8.0)\n",
-      "Requirement already satisfied: google-api-core<3.0.0,>=1.0.0 in /usr/local/lib/python3.7/dist-packages (from opencensus->ray[data,serve,tune]) (1.31.5)\n",
-      "Requirement already satisfied: opencensus-context>=0.1.2 in /usr/local/lib/python3.7/dist-packages (from opencensus->ray[data,serve,tune]) (0.1.2)\n",
-      "Requirement already satisfied: pytz in /usr/local/lib/python3.7/dist-packages (from google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (2022.1)\n",
-      "Requirement already satisfied: google-auth<2.0dev,>=1.25.0 in /usr/local/lib/python3.7/dist-packages (from google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (1.35.0)\n",
-      "Requirement already satisfied: googleapis-common-protos<2.0dev,>=1.6.0 in /usr/local/lib/python3.7/dist-packages (from google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (1.56.1)\n",
-      "Requirement already satisfied: setuptools>=40.3.0 in /usr/local/lib/python3.7/dist-packages (from google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (57.4.0)\n",
-      "Requirement already satisfied: packaging>=14.3 in /usr/local/lib/python3.7/dist-packages (from google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (21.3)\n",
-      "Requirement already satisfied: pyasn1-modules>=0.2.1 in /usr/local/lib/python3.7/dist-packages (from google-auth<2.0dev,>=1.25.0->google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (0.2.8)\n",
-      "Requirement already satisfied: rsa<5,>=3.1.4 in /usr/local/lib/python3.7/dist-packages (from google-auth<2.0dev,>=1.25.0->google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (4.8)\n",
-      "Requirement already satisfied: cachetools<5.0,>=2.0.0 in /usr/local/lib/python3.7/dist-packages (from google-auth<2.0dev,>=1.25.0->google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (4.2.4)\n",
-      "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /usr/local/lib/python3.7/dist-packages (from packaging>=14.3->google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (3.0.9)\n",
-      "Requirement already satisfied: pyasn1<0.5.0,>=0.4.6 in /usr/local/lib/python3.7/dist-packages (from pyasn1-modules>=0.2.1->google-auth<2.0dev,>=1.25.0->google-api-core<3.0.0,>=1.0.0->opencensus->ray[data,serve,tune]) (0.4.8)\n",
-      "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests->ray[data,serve,tune]) (1.24.3)\n",
-      "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests->ray[data,serve,tune]) (3.0.4)\n",
-      "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests->ray[data,serve,tune]) (2022.5.18.1)\n",
-      "Requirement already satisfied: python-dateutil>=2.7.3 in /usr/local/lib/python3.7/dist-packages (from pandas->ray[data,serve,tune]) (2.8.2)\n",
-      "Requirement already satisfied: distlib<1,>=0.3.1 in /usr/local/lib/python3.7/dist-packages (from virtualenv->ray[data,serve,tune]) (0.3.4)\n",
-      "Requirement already satisfied: platformdirs<3,>=2 in /usr/local/lib/python3.7/dist-packages (from virtualenv->ray[data,serve,tune]) (2.5.2)\n",
-      "Found existing installation: ray 2.0.0.dev0\n",
-      "Uninstalling ray-2.0.0.dev0:\n",
-      "  Successfully uninstalled ray-2.0.0.dev0\n",
-      "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
-      "Collecting ray==3.0.0.dev0\n",
-      "  Downloading https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-3.0.0.dev0-cp37-cp37m-manylinux2014_x86_64.whl (54.9 MB)\n",
-      "\u001b[K     |████████████████████████████████| 54.9 MB 74.4 MB/s \n",
-      "\u001b[?25hRequirement already satisfied: msgpack<2.0.0,>=1.0.0 in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (1.0.3)\n",
-      "Requirement already satisfied: virtualenv in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (20.14.1)\n",
-      "Requirement already satisfied: protobuf>=3.15.3 in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (3.17.3)\n",
-      "Requirement already satisfied: pyyaml in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (3.13)\n",
-      "Requirement already satisfied: click<=8.0.4,>=7.0 in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (7.1.2)\n",
-      "Requirement already satisfied: attrs in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (21.4.0)\n",
-      "Requirement already satisfied: requests in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (2.23.0)\n",
-      "Requirement already satisfied: frozenlist in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (1.3.0)\n",
-      "Requirement already satisfied: aiosignal in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (1.2.0)\n",
-      "Requirement already satisfied: numpy>=1.16 in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (1.21.6)\n",
-      "Requirement already satisfied: jsonschema in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (4.3.3)\n",
-      "Requirement already satisfied: grpcio<=1.43.0,>=1.28.1 in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (1.43.0)\n",
-      "Requirement already satisfied: filelock in /usr/local/lib/python3.7/dist-packages (from ray==3.0.0.dev0) (3.7.0)\n",
-      "Requirement already satisfied: six>=1.5.2 in /usr/local/lib/python3.7/dist-packages (from grpcio<=1.43.0,>=1.28.1->ray==3.0.0.dev0) (1.15.0)\n",
-      "Requirement already satisfied: pyrsistent!=0.17.0,!=0.17.1,!=0.17.2,>=0.14.0 in /usr/local/lib/python3.7/dist-packages (from jsonschema->ray==3.0.0.dev0) (0.18.1)\n",
-      "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.7/dist-packages (from jsonschema->ray==3.0.0.dev0) (4.2.0)\n",
-      "Requirement already satisfied: importlib-metadata in /usr/local/lib/python3.7/dist-packages (from jsonschema->ray==3.0.0.dev0) (4.11.3)\n",
-      "Requirement already satisfied: importlib-resources>=1.4.0 in /usr/local/lib/python3.7/dist-packages (from jsonschema->ray==3.0.0.dev0) (5.7.1)\n",
-      "Requirement already satisfied: zipp>=3.1.0 in /usr/local/lib/python3.7/dist-packages (from importlib-resources>=1.4.0->jsonschema->ray==3.0.0.dev0) (3.8.0)\n",
-      "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests->ray==3.0.0.dev0) (2.10)\n",
-      "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests->ray==3.0.0.dev0) (3.0.4)\n",
-      "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests->ray==3.0.0.dev0) (1.24.3)\n",
-      "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests->ray==3.0.0.dev0) (2022.5.18.1)\n",
-      "Requirement already satisfied: platformdirs<3,>=2 in /usr/local/lib/python3.7/dist-packages (from virtualenv->ray==3.0.0.dev0) (2.5.2)\n",
-      "Requirement already satisfied: distlib<1,>=0.3.1 in /usr/local/lib/python3.7/dist-packages (from virtualenv->ray==3.0.0.dev0) (0.3.4)\n",
-      "Installing collected packages: ray\n",
-      "Successfully installed ray-3.0.0.dev0\n",
-      "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
-      "Requirement already satisfied: torch in /usr/local/lib/python3.7/dist-packages (1.11.0+cu113)\n",
-      "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.7/dist-packages (from torch) (4.2.0)\n",
-      "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
-      "Requirement already satisfied: torchvision in /usr/local/lib/python3.7/dist-packages (0.12.0+cu113)\n",
-      "Requirement already satisfied: requests in /usr/local/lib/python3.7/dist-packages (from torchvision) (2.23.0)\n",
-      "Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /usr/local/lib/python3.7/dist-packages (from torchvision) (7.1.2)\n",
-      "Requirement already satisfied: numpy in /usr/local/lib/python3.7/dist-packages (from torchvision) (1.21.6)\n",
-      "Requirement already satisfied: torch==1.11.0 in /usr/local/lib/python3.7/dist-packages (from torchvision) (1.11.0+cu113)\n",
-      "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.7/dist-packages (from torchvision) (4.2.0)\n",
-      "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests->torchvision) (2.10)\n",
-      "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests->torchvision) (2022.5.18.1)\n",
-      "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests->torchvision) (3.0.4)\n",
-      "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests->torchvision) (1.24.3)\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "# !pip install -q \"ray[air]\"\n",
     "# !pip install -q torch\n",
@@ -232,13 +106,56 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-25 22:25:31,150\tINFO services.py:1483 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8265\u001b[39m\u001b[22m\n"
+      "2022-07-20 21:47:49,873\tINFO services.py:1483 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8265\u001b[39m\u001b[22m\n"
      ]
     },
     {
      "data": {
+      "text/html": [
+       "<div>\n",
+       "    <div style=\"margin-left: 50px;display: flex;flex-direction: row;align-items: center\">\n",
+       "        <h3 style=\"color: var(--jp-ui-font-color0)\">Ray</h3>\n",
+       "        <svg version=\"1.1\" id=\"ray\" width=\"3em\" viewBox=\"0 0 144.5 144.6\" style=\"margin-left: 3em;margin-right: 3em\">\n",
+       "            <g id=\"layer-1\">\n",
+       "                <path fill=\"#00a2e9\" class=\"st0\" d=\"M97.3,77.2c-3.8-1.1-6.2,0.9-8.3,5.1c-3.5,6.8-9.9,9.9-17.4,9.6S58,88.1,54.8,81.2c-1.4-3-3-4-6.3-4.1\n",
+       "                    c-5.6-0.1-9.9,0.1-13.1,6.4c-3.8,7.6-13.6,10.2-21.8,7.6C5.2,88.4-0.4,80.5,0,71.7c0.1-8.4,5.7-15.8,13.8-18.2\n",
+       "                    c8.4-2.6,17.5,0.7,22.3,8c1.3,1.9,1.3,5.2,3.6,5.6c3.9,0.6,8,0.2,12,0.2c1.8,0,1.9-1.6,2.4-2.8c3.5-7.8,9.7-11.8,18-11.9\n",
+       "                    c8.2-0.1,14.4,3.9,17.8,11.4c1.3,2.8,2.9,3.6,5.7,3.3c1-0.1,2,0.1,3,0c2.8-0.5,6.4,1.7,8.1-2.7s-2.3-5.5-4.1-7.5\n",
+       "                    c-5.1-5.7-10.9-10.8-16.1-16.3C84,38,81.9,37.1,78,38.3C66.7,42,56.2,35.7,53,24.1C50.3,14,57.3,2.8,67.7,0.5\n",
+       "                    C78.4-2,89,4.7,91.5,15.3c0.1,0.3,0.1,0.5,0.2,0.8c0.7,3.4,0.7,6.9-0.8,9.8c-1.7,3.2-0.8,5,1.5,7.2c6.7,6.5,13.3,13,19.8,19.7\n",
+       "                    c1.8,1.8,3,2.1,5.5,1.2c9.1-3.4,17.9-0.6,23.4,7c4.8,6.9,4.6,16.1-0.4,22.9c-5.4,7.2-14.2,9.9-23.1,6.5c-2.3-0.9-3.5-0.6-5.1,1.1\n",
+       "                    c-6.7,6.9-13.6,13.7-20.5,20.4c-1.8,1.8-2.5,3.2-1.4,5.9c3.5,8.7,0.3,18.6-7.7,23.6c-7.9,5-18.2,3.8-24.8-2.9\n",
+       "                    c-6.4-6.4-7.4-16.2-2.5-24.3c4.9-7.8,14.5-11,23.1-7.8c3,1.1,4.7,0.5,6.9-1.7C91.7,98.4,98,92.3,104.2,86c1.6-1.6,4.1-2.7,2.6-6.2\n",
+       "                    c-1.4-3.3-3.8-2.5-6.2-2.6C99.8,77.2,98.9,77.2,97.3,77.2z M72.1,29.7c5.5,0.1,9.9-4.3,10-9.8c0-0.1,0-0.2,0-0.3\n",
+       "                    C81.8,14,77,9.8,71.5,10.2c-5,0.3-9,4.2-9.3,9.2c-0.2,5.5,4,10.1,9.5,10.3C71.8,29.7,72,29.7,72.1,29.7z M72.3,62.3\n",
+       "                    c-5.4-0.1-9.9,4.2-10.1,9.7c0,0.2,0,0.3,0,0.5c0.2,5.4,4.5,9.7,9.9,10c5.1,0.1,9.9-4.7,10.1-9.8c0.2-5.5-4-10-9.5-10.3\n",
+       "                    C72.6,62.3,72.4,62.3,72.3,62.3z M115,72.5c0.1,5.4,4.5,9.7,9.8,9.9c5.6-0.2,10-4.8,10-10.4c-0.2-5.4-4.6-9.7-10-9.7\n",
+       "                    c-5.3-0.1-9.8,4.2-9.9,9.5C115,72.1,115,72.3,115,72.5z M19.5,62.3c-5.4,0.1-9.8,4.4-10,9.8c-0.1,5.1,5.2,10.4,10.2,10.3\n",
+       "                    c5.6-0.2,10-4.9,9.8-10.5c-0.1-5.4-4.5-9.7-9.9-9.6C19.6,62.3,19.5,62.3,19.5,62.3z M71.8,134.6c5.9,0.2,10.3-3.9,10.4-9.6\n",
+       "                    c0.5-5.5-3.6-10.4-9.1-10.8c-5.5-0.5-10.4,3.6-10.8,9.1c0,0.5,0,0.9,0,1.4c-0.2,5.3,4,9.8,9.3,10\n",
+       "                    C71.6,134.6,71.7,134.6,71.8,134.6z\"/>\n",
+       "            </g>\n",
+       "        </svg>\n",
+       "        <table>\n",
+       "            <tr>\n",
+       "                <td style=\"text-align: left\"><b>Python version:</b></td>\n",
+       "                <td style=\"text-align: left\"><b>3.7.10</b></td>\n",
+       "            </tr>\n",
+       "            <tr>\n",
+       "                <td style=\"text-align: left\"><b>Ray version:</b></td>\n",
+       "                <td style=\"text-align: left\"><b> 3.0.0.dev0</b></td>\n",
+       "            </tr>\n",
+       "            <tr>\n",
+       "    <td style=\"text-align: left\"><b>Dashboard:</b></td>\n",
+       "    <td style=\"text-align: left\"><b><a href=\"http://127.0.0.1:8265\" target=\"_blank\">http://127.0.0.1:8265</a></b></td>\n",
+       "</tr>\n",
+       "\n",
+       "        </table>\n",
+       "    </div>\n",
+       "</div>\n"
+      ],
       "text/plain": [
-       "RayContext(dashboard_url='127.0.0.1:8265', python_version='3.7.13', ray_version='3.0.0.dev0', ray_commit='ac620aeec0c0f68c92328ace0b2a5835f5b14b26', address_info={'node_ip_address': '172.28.0.2', 'raylet_ip_address': '172.28.0.2', 'redis_address': None, 'object_store_address': '/tmp/ray/session_2022-05-25_22-25-28_641559_1518/sockets/plasma_store', 'raylet_socket_name': '/tmp/ray/session_2022-05-25_22-25-28_641559_1518/sockets/raylet', 'webui_url': '127.0.0.1:8265', 'session_dir': '/tmp/ray/session_2022-05-25_22-25-28_641559_1518', 'metrics_export_port': 61030, 'gcs_address': '172.28.0.2:62940', 'address': '172.28.0.2:62940', 'node_id': '97455d0de12f3393126427ed2b1ef0a009f0bd3fb97177cb86b42d92'})"
+       "RayContext(dashboard_url='127.0.0.1:8265', python_version='3.7.10', ray_version='3.0.0.dev0', ray_commit='{{RAY_COMMIT_SHA}}', address_info={'node_ip_address': '127.0.0.1', 'raylet_ip_address': '127.0.0.1', 'redis_address': None, 'object_store_address': '/tmp/ray/session_2022-07-20_21-47-47_297236_39344/sockets/plasma_store', 'raylet_socket_name': '/tmp/ray/session_2022-07-20_21-47-47_297236_39344/sockets/raylet', 'webui_url': '127.0.0.1:8265', 'session_dir': '/tmp/ray/session_2022-07-20_21-47-47_297236_39344', 'metrics_export_port': 62008, 'gcs_address': '127.0.0.1:57307', 'address': '127.0.0.1:57307', 'dashboard_agent_listen_port': 52365, 'node_id': 'db68eafa3bbe9042df574f3c9974b40ce8d97728db90282feefb4690'})"
       ]
      },
      "execution_count": 2,
@@ -266,7 +183,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": null,
    "metadata": {
     "id": "3TVkSmFFCHhI"
    },
@@ -595,6 +512,7 @@
    "outputs": [],
    "source": [
     "from ray.data.preprocessors import BatchMapper\n",
+    "from ray.data.extensions import TensorArray\n",
     "\n",
     "from torchvision import transforms\n",
     "\n",
@@ -605,7 +523,7 @@
     "      [transforms.ToTensor(), transforms.Normalize((0.1307,), (0.3081,))]\n",
     "    )\n",
     "\n",
-    "    df[\"image\"] = df[\"image\"].map(torchvision_transforms)\n",
+    "    df[\"image\"] = TensorArray([torchvision_transforms(image) for image in df[\"image\"]])\n",
     "    return df\n",
     "\n",
     "mnist_normalize_preprocessor = BatchMapper(fn=preprocess_images)"
@@ -704,7 +622,13 @@
     "      return df\n",
     "\n",
     "  deployment = PredictorDeployment.options(name=\"mnist_model\", route_prefix=\"/mnist_predict\", version=f\"v{task_idx}\", num_replicas=2)\n",
-    "  deployment.deploy(batching_params=False, http_adapter=json_to_pandas, predictor_cls=TorchPredictor, checkpoint=latest_checkpoint, model=SimpleMLP(num_classes=10))\n",
+    "  deployment.deploy(\n",
+    "    batching_params=dict(max_batch_size=10, batch_wait_timeout_s=5),\n",
+    "    http_adapter=json_to_pandas, \n",
+    "    predictor_cls=TorchPredictor, \n",
+    "    checkpoint=latest_checkpoint, \n",
+    "    model=SimpleMLP(num_classes=10)\n",
+    "  )\n",
     "  return deployment.url\n",
     "\n",
     "# Function that queries our deployed model\n",
@@ -753,14 +677,11 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(_prepare_read pid=1772)\u001b[0m 2022-05-25 22:25:35,236\tWARNING torch_datasource.py:56 -- `SimpleTorchDatasource` doesn't support parallel reads. The `parallelism` argument will be ignored.\n",
-      "Read->Map_Batches: 100%|██████████| 1/1 [00:05<00:00,  5.92s/it]\n",
-      "\u001b[2m\u001b[36m(_prepare_read pid=1772)\u001b[0m 2022-05-25 22:25:53,593\tWARNING torch_datasource.py:56 -- `SimpleTorchDatasource` doesn't support parallel reads. The `parallelism` argument will be ignored.\n",
-      "Read->Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  2.51it/s]\n",
-      "Map Progress (2 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.72s/it]\n",
-      "\u001b[2m\u001b[36m(_prepare_read pid=1978)\u001b[0m 2022-05-25 22:25:58,761\tWARNING torch_datasource.py:56 -- `SimpleTorchDatasource` doesn't support parallel reads. The `parallelism` argument will be ignored.\n",
-      "Read->Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  2.41it/s]\n",
-      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.37s/it]"
+      "Read->Map_Batches: 100%|██████████| 1/1 [00:06<00:00,  6.40s/it]\n",
+      "Read->Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  2.12it/s]\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.34s/it]\n",
+      "Read->Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  2.29it/s]\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.33s/it]\n"
      ]
     },
     {
@@ -770,22 +691,15 @@
       "Starting training for task: 0\n"
      ]
     },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "\n"
-     ]
-    },
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-05-25 22:27:16 (running for 00:01:14.46)<br>Memory usage on this node: 4.7/12.7 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/2 CPUs, 0/1 GPUs, 0.0/7.31 GiB heap, 0.0/3.66 GiB objects (0.0/1.0 accelerator_type:T4)<br>Result logdir: /root/ray_results/TorchTrainer_2022-05-25_22-26-01<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-07-20 21:48:52 (running for 00:00:39.66)<br>Memory usage on this node: 33.1/64.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/28.14 GiB heap, 0.0/2.0 GiB objects<br>Result logdir: /Users/jiaodong/ray_results/TorchTrainer_2022-07-20_21-48-13<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name              </th><th>status    </th><th>loc            </th></tr>\n",
+       "<tr><th>Trial name              </th><th>status    </th><th>loc            </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">   loss</th><th style=\"text-align: right;\">  _timestamp</th><th style=\"text-align: right;\">  _time_this_iter_s</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>TorchTrainer_a8585_00000</td><td>TERMINATED</td><td>172.28.0.2:2126</td></tr>\n",
+       "<tr><td>TorchTrainer_53c58_00000</td><td>TERMINATED</td><td>127.0.0.1:39548</td><td style=\"text-align: right;\">     4</td><td style=\"text-align: right;\">         36.4582</td><td style=\"text-align: right;\">824.229</td><td style=\"text-align: right;\">  1658378932</td><td style=\"text-align: right;\">            6.46339</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -800,125 +714,102 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(_map_block_nosplit pid=2159)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(_map_block_nosplit pid=2159)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m 2022-05-25 22:26:19,944\tINFO torch.py:347 -- Setting up process group for: env:// [rank=0, world_size=1]\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m 2022-05-25 22:26:20,033\tINFO torch.py:98 -- Moving model to device: cuda:0\n"
+      "2022-07-20 21:48:13,244\tINFO plugin_schema_manager.py:52 -- Loading the default runtime env schemas: ['/Users/jiaodong/Workspace/ray/python/ray/_private/runtime_env/../../runtime_env/schemas/working_dir_schema.json', '/Users/jiaodong/Workspace/ray/python/ray/_private/runtime_env/../../runtime_env/schemas/pip_schema.json'].\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 2.315190, epoch: 0, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 1.464406, epoch: 0, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 1.279081, epoch: 0, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 1.052461, epoch: 0, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.816213, epoch: 1, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 1.019127, epoch: 1, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.525613, epoch: 1, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.570595, epoch: 1, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.572004, epoch: 2, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.543432, epoch: 2, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.350156, epoch: 2, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.443743, epoch: 2, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.438318, epoch: 3, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.342512, epoch: 3, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.302048, epoch: 3, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2197)\u001b[0m loss: 0.414025, epoch: 3, iteration: 1500\n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 2.282040, epoch: 0, iteration: 0\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-25 22:27:16,013\tERROR checkpoint_manager.py:193 -- Result dict has no key: training_iteration. checkpoint_score_attr must be set to a key of the result dict. Valid keys are ['trial_id', 'experiment_id', 'date', 'timestamp', 'pid', 'hostname', 'node_ip', 'config', 'done']\n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m 2022-07-20 21:48:26,772\tINFO train_loop_utils.py:298 -- Moving model to device: cpu\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Trial TorchTrainer_a8585_00000 completed. Last result: \n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 1.521038, epoch: 0, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 1.169452, epoch: 0, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.856338, epoch: 0, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.788410, epoch: 1, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.854239, epoch: 1, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.533351, epoch: 1, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.591339, epoch: 1, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.457057, epoch: 2, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.594715, epoch: 2, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.477588, epoch: 2, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.235412, epoch: 2, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.507374, epoch: 3, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.447128, epoch: 3, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.381943, epoch: 3, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39562)\u001b[0m loss: 0.347877, epoch: 3, iteration: 1500\n",
+      "Result for TorchTrainer_53c58_00000:\n",
+      "  _time_this_iter_s: 6.463389873504639\n",
+      "  _timestamp: 1658378932\n",
+      "  _training_iteration: 4\n",
+      "  date: 2022-07-20_21-48-52\n",
+      "  done: true\n",
+      "  experiment_id: abc531ef544440268933d8221addeb9d\n",
+      "  experiment_tag: '0'\n",
+      "  hostname: Jiaos-MacBook-Pro-16-inch-2019\n",
+      "  iterations_since_restore: 4\n",
+      "  loss: 824.2287287414074\n",
+      "  node_ip: 127.0.0.1\n",
+      "  pid: 39548\n",
+      "  should_checkpoint: true\n",
+      "  time_since_restore: 36.45815992355347\n",
+      "  time_this_iter_s: 6.464020013809204\n",
+      "  time_total_s: 36.45815992355347\n",
+      "  timestamp: 1658378932\n",
+      "  timesteps_since_restore: 0\n",
+      "  training_iteration: 4\n",
+      "  trial_id: 53c58_00000\n",
+      "  warmup_time: 0.003597259521484375\n",
+      "  \n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-25 22:27:16,138\tINFO tune.py:753 -- Total run time: 74.68 seconds (74.45 seconds for the tuning loop).\n",
-      "Map Progress (1 actors 1 pending):   0%|          | 0/1 [00:01<?, ?it/s]\u001b[2m\u001b[36m(BlockWorker pid=2267)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(BlockWorker pid=2267)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "Map Progress (2 actors 1 pending): 100%|██████████| 1/1 [00:04<00:00,  4.18s/it]\n",
-      "Map_Batches: 100%|██████████| 1/1 [00:01<00:00,  1.63s/it]\n",
-      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 13.60it/s]\n",
-      "Shuffle Map: 100%|██████████| 1/1 [00:00<00:00, 24.76it/s]\n",
-      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00, 49.17it/s]\n"
+      "2022-07-20 21:48:52,891\tINFO tune.py:738 -- Total run time: 39.80 seconds (39.66 seconds for the tuning loop).\n",
+      "Map Progress (1 actors 1 pending):   0%|          | 0/1 [00:01<?, ?it/s]\u001b[2m\u001b[36m(BlockWorker pid=39601)\u001b[0m /Users/jiaodong/anaconda3/envs/ray3.7/lib/python3.7/site-packages/torchvision/transforms/functional.py:150: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  /Users/runner/work/pytorch/pytorch/pytorch/torch/csrc/utils/tensor_numpy.cpp:178.)\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:03<00:00,  3.01s/it]\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  8.70it/s]\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 76.13it/s]\n",
+      "Shuffle Map: 100%|██████████| 1/1 [00:00<00:00, 82.57it/s]\n",
+      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00, 134.32it/s]\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Accuracy for task 1: 0.946\n"
+      "Accuracy for task 1: 0.3767\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(ServeController pid=2382)\u001b[0m INFO 2022-05-25 22:27:23,467 controller 2382 checkpoint_path.py:17 - Using RayInternalKVStore for controller checkpoint and recovery.\n",
-      "\u001b[2m\u001b[36m(ServeController pid=2382)\u001b[0m INFO 2022-05-25 22:27:23,470 controller 2382 http_state.py:115 - Starting HTTP proxy with name 'SERVE_CONTROLLER_ACTOR:XnXlnS:SERVE_PROXY_ACTOR-node:172.28.0.2-0' on node 'node:172.28.0.2-0' listening on '127.0.0.1:8000'\n",
-      "Shuffle Map:   0%|          | 0/1 [00:00<?, ?it/s]\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO:     Started server process [2415]\n",
-      "Shuffle Map: 100%|██████████| 1/1 [00:01<00:00,  1.40s/it]\n",
-      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00,  7.72it/s]\n",
-      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.18s/it]\n",
-      "\u001b[2m\u001b[36m(ServeController pid=2382)\u001b[0m INFO 2022-05-25 22:27:28,825 controller 2382 deployment_state.py:1219 - Adding 2 replicas to deployment 'mnist_model'.\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:32,954 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 4.8ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:32,977 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 21.4ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:32,985 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 4.4ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:32,976 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 15.5ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:32,992 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 5.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:32,952 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.4ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:32,982 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:32,997 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 11.8ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,008 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 6.1ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,017 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.1ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,022 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,031 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,036 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,044 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.4ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,048 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,057 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.9ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,061 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.2ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,070 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.4ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,074 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,082 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.4ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,088 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 3.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:33,016 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 4.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:33,029 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 4.4ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:33,043 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 4.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:33,056 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 4.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:33,068 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 4.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:33,081 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 4.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:33,007 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:33,021 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:33,035 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:33,047 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:33,060 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:33,073 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:33,086 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,122 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 25.8ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,134 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 3.0ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=2415)\u001b[0m INFO 2022-05-25 22:27:33,142 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:33,117 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 14.4ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2573)\u001b[0m INFO 2022-05-25 22:27:33,141 mnist_model mnist_model#vDEhSp replica.py:483 - HANDLE __call__ OK 4.4ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=2575)\u001b[0m INFO 2022-05-25 22:27:33,133 mnist_model mnist_model#QdDxIB replica.py:483 - HANDLE __call__ OK 0.4ms\n",
-      "\u001b[2m\u001b[36m(ServeController pid=2382)\u001b[0m INFO 2022-05-25 22:27:33,225 controller 2382 deployment_state.py:1243 - Removing 2 replicas from deployment 'mnist_model'.\n",
-      "Map Progress (2 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.58s/it]\n",
-      "\u001b[2m\u001b[36m(_prepare_read pid=2726)\u001b[0m 2022-05-25 22:27:40,353\tWARNING torch_datasource.py:56 -- `SimpleTorchDatasource` doesn't support parallel reads. The `parallelism` argument will be ignored.\n",
-      "Read->Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  2.20it/s]\n",
-      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.41s/it]"
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:48:57,458 controller 39625 checkpoint_path.py:17 - Using RayInternalKVStore for controller checkpoint and recovery.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:48:57,460 controller 39625 http_state.py:126 - Starting HTTP proxy with name 'SERVE_CONTROLLER_ACTOR:oEzsmU:SERVE_PROXY_ACTOR-db68eafa3bbe9042df574f3c9974b40ce8d97728db90282feefb4690' on node 'db68eafa3bbe9042df574f3c9974b40ce8d97728db90282feefb4690' listening on '127.0.0.1:8000'\n",
+      "Shuffle Map:   0%|          | 0/1 [00:00<?, ?it/s]\u001b[2m\u001b[36m(HTTPProxyActor pid=39628)\u001b[0m INFO:     Started server process [39628]\n",
+      "Shuffle Map: 100%|██████████| 1/1 [00:00<00:00,  8.12it/s]\n",
+      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00,  5.80it/s]\n",
+      "Map Progress (1 actors 0 pending): 100%|██████████| 1/1 [00:01<00:00,  1.16s/it]\n",
+      "/Users/jiaodong/anaconda3/envs/ray3.7/lib/python3.7/site-packages/ipykernel_launcher.py:25: UserWarning: From /var/folders/1s/wy6f3ytn3q726p5hl8fw8d780000gn/T/ipykernel_39344/1249059442.py:25: deploy (from ray.serve.deployment) is deprecated and will be removed in a future version Please see https://docs.ray.io/en/latest/serve/index.html\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:49:00,913 controller 39625 deployment_state.py:1281 - Adding 2 replicas to deployment 'mnist_model'.\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.39s/it]\n",
+      "Read->Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  2.39it/s]\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.37s/it]\n"
      ]
     },
     {
@@ -928,22 +819,15 @@
       "Starting training for task: 1\n"
      ]
     },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "\n"
-     ]
-    },
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-05-25 22:28:52 (running for 00:01:09.00)<br>Memory usage on this node: 5.0/12.7 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/2 CPUs, 0/1 GPUs, 0.0/7.31 GiB heap, 0.0/3.66 GiB objects (0.0/1.0 accelerator_type:T4)<br>Result logdir: /root/ray_results/TorchTrainer_2022-05-25_22-27-43<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-07-20 21:50:36 (running for 00:00:37.98)<br>Memory usage on this node: 33.7/64.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/28.14 GiB heap, 0.0/2.0 GiB objects<br>Result logdir: /Users/jiaodong/ray_results/TorchTrainer_2022-07-20_21-49-58<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name              </th><th>status    </th><th>loc            </th></tr>\n",
+       "<tr><th>Trial name              </th><th>status    </th><th>loc            </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">   loss</th><th style=\"text-align: right;\">  _timestamp</th><th style=\"text-align: right;\">  _time_this_iter_s</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>TorchTrainer_e4f66_00000</td><td>TERMINATED</td><td>172.28.0.2:2875</td></tr>\n",
+       "<tr><td>TorchTrainer_92bcd_00000</td><td>TERMINATED</td><td>127.0.0.1:39736</td><td style=\"text-align: right;\">     4</td><td style=\"text-align: right;\">         34.1132</td><td style=\"text-align: right;\">707.634</td><td style=\"text-align: right;\">  1658379035</td><td style=\"text-align: right;\">            6.45643</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -958,125 +842,105 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(_map_block_nosplit pid=2909)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(_map_block_nosplit pid=2909)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m 2022-05-25 22:28:01,917\tINFO torch.py:347 -- Setting up process group for: env:// [rank=0, world_size=1]\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m 2022-05-25 22:28:02,063\tINFO torch.py:98 -- Moving model to device: cuda:0\n"
+      "\u001b[2m\u001b[36m(TorchTrainer pid=39736)\u001b[0m 2022-07-20 21:50:01,936\tWARNING base_trainer.py:167 -- When passing `datasets` to a Trainer, it is recommended to reserve at least 20% of node CPUs for Dataset execution by setting `_max_cpu_fraction_per_node = 0.8` in the Trainer `scaling_config`. Not doing so can lead to resource contention or hangs. See https://docs.ray.io/en/master/data/key-concepts.html#example-datasets-in-tune for more info.\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m 2022-07-20 21:50:09,489\tINFO config.py:71 -- Setting up process group for: env:// [rank=0, world_size=1]\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m [W ProcessGroupGloo.cpp:715] Warning: Unable to resolve hostname to a (local) address. Using the loopback address as fallback. Manually set the network interface to bind to with GLOO_SOCKET_IFNAME. (function operator())\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 3.347775, epoch: 0, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 1.343975, epoch: 0, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.768560, epoch: 0, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.607410, epoch: 0, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.578952, epoch: 1, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.473788, epoch: 1, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.609530, epoch: 1, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.741895, epoch: 1, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.417272, epoch: 2, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.510404, epoch: 2, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.422137, epoch: 2, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.403623, epoch: 2, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.384720, epoch: 3, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.414567, epoch: 3, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.274302, epoch: 3, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=2948)\u001b[0m loss: 0.348169, epoch: 3, iteration: 1500\n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 3.301114, epoch: 0, iteration: 0\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-25 22:28:52,221\tERROR checkpoint_manager.py:193 -- Result dict has no key: training_iteration. checkpoint_score_attr must be set to a key of the result dict. Valid keys are ['trial_id', 'experiment_id', 'date', 'timestamp', 'pid', 'hostname', 'node_ip', 'config', 'done']\n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m 2022-07-20 21:50:09,795\tINFO train_loop_utils.py:298 -- Moving model to device: cpu\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m /Users/jiaodong/Workspace/ray/python/ray/air/_internal/torch_utils.py:64: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  /Users/runner/work/pytorch/pytorch/pytorch/torch/csrc/utils/tensor_numpy.cpp:178.)\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m   return torch.as_tensor(vals, dtype=dtype)\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Trial TorchTrainer_e4f66_00000 completed. Last result: \n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 1.075076, epoch: 0, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.536976, epoch: 0, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.600182, epoch: 0, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.546070, epoch: 1, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.448120, epoch: 1, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.392481, epoch: 1, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.371981, epoch: 1, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.521735, epoch: 2, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.635850, epoch: 2, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.395862, epoch: 2, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.402500, epoch: 2, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.236922, epoch: 3, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.528482, epoch: 3, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.372242, epoch: 3, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39752)\u001b[0m loss: 0.355759, epoch: 3, iteration: 1500\n",
+      "Result for TorchTrainer_92bcd_00000:\n",
+      "  _time_this_iter_s: 6.456433057785034\n",
+      "  _timestamp: 1658379035\n",
+      "  _training_iteration: 4\n",
+      "  date: 2022-07-20_21-50-36\n",
+      "  done: true\n",
+      "  experiment_id: 21820161d0a245428cf75b0b9b17fe6e\n",
+      "  experiment_tag: '0'\n",
+      "  hostname: Jiaos-MacBook-Pro-16-inch-2019\n",
+      "  iterations_since_restore: 4\n",
+      "  loss: 707.6341038495302\n",
+      "  node_ip: 127.0.0.1\n",
+      "  pid: 39736\n",
+      "  should_checkpoint: true\n",
+      "  time_since_restore: 34.11321783065796\n",
+      "  time_this_iter_s: 6.463765859603882\n",
+      "  time_total_s: 34.11321783065796\n",
+      "  timestamp: 1658379036\n",
+      "  timesteps_since_restore: 0\n",
+      "  training_iteration: 4\n",
+      "  trial_id: 92bcd_00000\n",
+      "  warmup_time: 0.005189180374145508\n",
+      "  \n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-25 22:28:52,344\tINFO tune.py:753 -- Total run time: 69.20 seconds (68.99 seconds for the tuning loop).\n",
-      "Map Progress (1 actors 1 pending):   0%|          | 0/2 [00:01<?, ?it/s]\u001b[2m\u001b[36m(BlockWorker pid=3027)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(BlockWorker pid=3027)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "Map Progress (2 actors 1 pending): 100%|██████████| 2/2 [00:05<00:00,  2.64s/it]\n",
-      "Map_Batches: 100%|██████████| 2/2 [00:01<00:00,  1.07it/s]\n",
-      "Map_Batches: 100%|██████████| 2/2 [00:01<00:00,  1.55it/s]\n",
-      "Shuffle Map: 100%|██████████| 2/2 [00:00<00:00,  3.78it/s]\n",
-      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00, 72.95it/s]\n"
+      "2022-07-20 21:50:36,835\tINFO tune.py:738 -- Total run time: 38.13 seconds (37.98 seconds for the tuning loop).\n",
+      "Map Progress (1 actors 1 pending):   0%|          | 0/2 [00:01<?, ?it/s]\u001b[2m\u001b[36m(BlockWorker pid=39801)\u001b[0m /Users/jiaodong/anaconda3/envs/ray3.7/lib/python3.7/site-packages/torchvision/transforms/functional.py:150: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  /Users/runner/work/pytorch/pytorch/pytorch/torch/csrc/utils/tensor_numpy.cpp:178.)\n",
+      "Map Progress (2 actors 1 pending): 100%|██████████| 2/2 [00:03<00:00,  1.96s/it]\n",
+      "Map_Batches: 100%|██████████| 2/2 [00:00<00:00,  5.28it/s]\n",
+      "Map_Batches: 100%|██████████| 2/2 [00:00<00:00, 114.72it/s]\n",
+      "Shuffle Map: 100%|██████████| 2/2 [00:00<00:00, 162.16it/s]\n",
+      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00, 140.57it/s]\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Accuracy for task 2: 0.9261\n"
+      "Accuracy for task 2: 0.36795\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(ServeController pid=3209)\u001b[0m INFO 2022-05-25 22:29:02,797 controller 3209 checkpoint_path.py:17 - Using RayInternalKVStore for controller checkpoint and recovery.\n",
-      "\u001b[2m\u001b[36m(ServeController pid=3209)\u001b[0m INFO 2022-05-25 22:29:02,802 controller 3209 http_state.py:115 - Starting HTTP proxy with name 'SERVE_CONTROLLER_ACTOR:lsPTvu:SERVE_PROXY_ACTOR-node:172.28.0.2-0' on node 'node:172.28.0.2-0' listening on '127.0.0.1:8000'\n",
-      "Shuffle Map:   0%|          | 0/1 [00:00<?, ?it/s]\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO:     Started server process [3241]\n",
-      "Shuffle Map: 100%|██████████| 1/1 [00:01<00:00,  1.54s/it]\n",
-      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00,  8.17it/s]\n",
-      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.15s/it]\n",
-      "\u001b[2m\u001b[36m(ServeController pid=3209)\u001b[0m INFO 2022-05-25 22:29:08,327 controller 3209 deployment_state.py:1219 - Adding 2 replicas to deployment 'mnist_model'.\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,440 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 5.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,438 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,460 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 15.4ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,466 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 24.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,471 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.8ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,481 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.6ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,487 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 3.9ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,496 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.9ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,501 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,509 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.8ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,514 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.6ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,523 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.8ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,528 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,537 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.2ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,542 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.5ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,550 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 6.7ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,556 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 3.7ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,564 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.0ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,480 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 5.1ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,495 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 4.5ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,508 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 4.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,522 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 4.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,536 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 4.7ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,549 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 4.4ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,563 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 4.7ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,470 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,485 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,500 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,513 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,527 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,540 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,554 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,586 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 4.6ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,596 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 9.3ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,601 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.7ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=3241)\u001b[0m INFO 2022-05-25 22:29:12,610 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.0ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,594 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 6.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3401)\u001b[0m INFO 2022-05-25 22:29:12,609 mnist_model mnist_model#uumYOV replica.py:483 - HANDLE __call__ OK 4.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,583 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=3402)\u001b[0m INFO 2022-05-25 22:29:12,600 mnist_model mnist_model#Egafuf replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(ServeController pid=3209)\u001b[0m INFO 2022-05-25 22:29:12,699 controller 3209 deployment_state.py:1243 - Removing 2 replicas from deployment 'mnist_model'.\n",
-      "Map Progress (2 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.56s/it]\n",
-      "\u001b[2m\u001b[36m(_prepare_read pid=3556)\u001b[0m 2022-05-25 22:29:19,825\tWARNING torch_datasource.py:56 -- `SimpleTorchDatasource` doesn't support parallel reads. The `parallelism` argument will be ignored.\n",
-      "Read->Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  2.44it/s]\n",
-      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.41s/it]"
+      "Shuffle Map: 100%|██████████| 1/1 [00:00<00:00,  6.24it/s]\n",
+      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00,  6.19it/s]\n",
+      "Map Progress (1 actors 0 pending): 100%|██████████| 1/1 [00:01<00:00,  1.18s/it]\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:50:42,924 controller 39625 deployment_state.py:1240 - Stopping 1 replicas of deployment 'mnist_model' with outdated versions.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:50:45,044 controller 39625 deployment_state.py:1281 - Adding 1 replicas to deployment 'mnist_model'.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:50:47,377 controller 39625 deployment_state.py:1240 - Stopping 1 replicas of deployment 'mnist_model' with outdated versions.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:50:49,504 controller 39625 deployment_state.py:1281 - Adding 1 replicas to deployment 'mnist_model'.\n",
+      "Map Progress (2 actors 0 pending): 100%|██████████| 1/1 [00:02<00:00,  2.36s/it]\n",
+      "Read->Map_Batches: 100%|██████████| 1/1 [00:00<00:00,  2.04it/s]\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.37s/it]\n"
      ]
     },
     {
@@ -1086,22 +950,15 @@
       "Starting training for task: 2\n"
      ]
     },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "\n"
-     ]
-    },
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-05-25 22:30:31 (running for 00:01:09.12)<br>Memory usage on this node: 5.0/12.7 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/2 CPUs, 0/1 GPUs, 0.0/7.31 GiB heap, 0.0/3.66 GiB objects (0.0/1.0 accelerator_type:T4)<br>Result logdir: /root/ray_results/TorchTrainer_2022-05-25_22-29-22<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-07-20 21:52:25 (running for 00:00:37.97)<br>Memory usage on this node: 34.0/64.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/28.14 GiB heap, 0.0/2.0 GiB objects<br>Result logdir: /Users/jiaodong/ray_results/TorchTrainer_2022-07-20_21-51-47<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name              </th><th>status    </th><th>loc            </th></tr>\n",
+       "<tr><th>Trial name              </th><th>status    </th><th>loc            </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">   loss</th><th style=\"text-align: right;\">  _timestamp</th><th style=\"text-align: right;\">  _time_this_iter_s</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>TorchTrainer_2040e_00000</td><td>TERMINATED</td><td>172.28.0.2:3703</td></tr>\n",
+       "<tr><td>TorchTrainer_d37db_00000</td><td>TERMINATED</td><td>127.0.0.1:39948</td><td style=\"text-align: right;\">     4</td><td style=\"text-align: right;\">         34.0141</td><td style=\"text-align: right;\">671.998</td><td style=\"text-align: right;\">  1658379144</td><td style=\"text-align: right;\">            6.59292</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -1116,123 +973,89 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(_map_block_nosplit pid=3738)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(_map_block_nosplit pid=3738)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m 2022-05-25 22:29:41,392\tINFO torch.py:347 -- Setting up process group for: env:// [rank=0, world_size=1]\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m 2022-05-25 22:29:41,549\tINFO torch.py:98 -- Moving model to device: cuda:0\n"
-     ]
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 4.353125, epoch: 0, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 1.147782, epoch: 0, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.609233, epoch: 0, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.606812, epoch: 0, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.494777, epoch: 1, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.776362, epoch: 1, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.376833, epoch: 1, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.478181, epoch: 1, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.413856, epoch: 2, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.668218, epoch: 2, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.318078, epoch: 2, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.427121, epoch: 2, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.369263, epoch: 3, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.479945, epoch: 3, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.457482, epoch: 3, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=3778)\u001b[0m loss: 0.318416, epoch: 3, iteration: 1500\n"
-     ]
-    },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "2022-05-25 22:30:31,831\tERROR checkpoint_manager.py:193 -- Result dict has no key: training_iteration. checkpoint_score_attr must be set to a key of the result dict. Valid keys are ['trial_id', 'experiment_id', 'date', 'timestamp', 'pid', 'hostname', 'node_ip', 'config', 'done']\n"
+      "\u001b[2m\u001b[36m(TorchTrainer pid=39948)\u001b[0m 2022-07-20 21:51:50,596\tWARNING base_trainer.py:167 -- When passing `datasets` to a Trainer, it is recommended to reserve at least 20% of node CPUs for Dataset execution by setting `_max_cpu_fraction_per_node = 0.8` in the Trainer `scaling_config`. Not doing so can lead to resource contention or hangs. See https://docs.ray.io/en/master/data/key-concepts.html#example-datasets-in-tune for more info.\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m 2022-07-20 21:51:58,118\tINFO config.py:71 -- Setting up process group for: env:// [rank=0, world_size=1]\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m [W ProcessGroupGloo.cpp:715] Warning: Unable to resolve hostname to a (local) address. Using the loopback address as fallback. Manually set the network interface to bind to with GLOO_SOCKET_IFNAME. (function operator())\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m 2022-07-20 21:51:58,367\tINFO train_loop_utils.py:298 -- Moving model to device: cpu\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Trial TorchTrainer_2040e_00000 completed. Last result: \n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 4.062408, epoch: 0, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.970063, epoch: 0, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.658269, epoch: 0, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.442650, epoch: 0, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.603212, epoch: 1, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.534739, epoch: 1, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.420072, epoch: 1, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.351545, epoch: 1, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.347010, epoch: 2, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.419703, epoch: 2, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.350773, epoch: 2, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.231652, epoch: 2, iteration: 1500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.343125, epoch: 3, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.547853, epoch: 3, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.353915, epoch: 3, iteration: 1000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=39968)\u001b[0m loss: 0.260028, epoch: 3, iteration: 1500\n",
+      "Result for TorchTrainer_d37db_00000:\n",
+      "  _time_this_iter_s: 6.5929179191589355\n",
+      "  _timestamp: 1658379144\n",
+      "  _training_iteration: 4\n",
+      "  date: 2022-07-20_21-52-24\n",
+      "  done: true\n",
+      "  experiment_id: 5d41bf13ba524c528faac8f64b13c7cc\n",
+      "  experiment_tag: '0'\n",
+      "  hostname: Jiaos-MacBook-Pro-16-inch-2019\n",
+      "  iterations_since_restore: 4\n",
+      "  loss: 671.9976235236973\n",
+      "  node_ip: 127.0.0.1\n",
+      "  pid: 39948\n",
+      "  should_checkpoint: true\n",
+      "  time_since_restore: 34.01405596733093\n",
+      "  time_this_iter_s: 6.590774774551392\n",
+      "  time_total_s: 34.01405596733093\n",
+      "  timestamp: 1658379144\n",
+      "  timesteps_since_restore: 0\n",
+      "  training_iteration: 4\n",
+      "  trial_id: d37db_00000\n",
+      "  warmup_time: 0.005116939544677734\n",
+      "  \n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-25 22:30:31,953\tINFO tune.py:753 -- Total run time: 69.33 seconds (69.12 seconds for the tuning loop).\n",
-      "Map Progress (1 actors 1 pending):   0%|          | 0/3 [00:01<?, ?it/s]\u001b[2m\u001b[36m(BlockWorker pid=3857)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(BlockWorker pid=3857)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "Map Progress (2 actors 1 pending):  33%|███▎      | 1/3 [00:04<00:08,  4.24s/it]\u001b[2m\u001b[36m(BlockWorker pid=3886)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(BlockWorker pid=3886)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "Map Progress (2 actors 1 pending): 100%|██████████| 3/3 [00:06<00:00,  2.16s/it]\n",
-      "Map_Batches: 100%|██████████| 3/3 [00:01<00:00,  1.53it/s]\n",
-      "Map_Batches: 100%|██████████| 3/3 [00:00<00:00, 19.25it/s]\n",
-      "Shuffle Map: 100%|██████████| 3/3 [00:00<00:00, 97.56it/s]\n",
-      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00, 64.24it/s]\n"
+      "2022-07-20 21:52:25,471\tINFO tune.py:738 -- Total run time: 38.13 seconds (37.97 seconds for the tuning loop).\n",
+      "Map Progress (1 actors 1 pending):   0%|          | 0/3 [00:01<?, ?it/s]\u001b[2m\u001b[36m(BlockWorker pid=40038)\u001b[0m /Users/jiaodong/anaconda3/envs/ray3.7/lib/python3.7/site-packages/torchvision/transforms/functional.py:150: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  /Users/runner/work/pytorch/pytorch/pytorch/torch/csrc/utils/tensor_numpy.cpp:178.)\n",
+      "Map Progress (2 actors 1 pending): 100%|██████████| 3/3 [00:04<00:00,  1.62s/it]\n",
+      "Map_Batches: 100%|██████████| 3/3 [00:00<00:00,  7.77it/s]\n",
+      "Map_Batches: 100%|██████████| 3/3 [00:00<00:00, 136.51it/s]\n",
+      "Shuffle Map: 100%|██████████| 3/3 [00:00<00:00, 216.98it/s]\n",
+      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00, 135.98it/s]\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Accuracy for task 3: 0.9001333333333333\n"
+      "Accuracy for task 3: 0.3590333333333333\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(ServeController pid=4011)\u001b[0m INFO 2022-05-25 22:30:43,081 controller 4011 checkpoint_path.py:17 - Using RayInternalKVStore for controller checkpoint and recovery.\n",
-      "\u001b[2m\u001b[36m(ServeController pid=4011)\u001b[0m INFO 2022-05-25 22:30:43,084 controller 4011 http_state.py:115 - Starting HTTP proxy with name 'SERVE_CONTROLLER_ACTOR:viEsyL:SERVE_PROXY_ACTOR-node:172.28.0.2-0' on node 'node:172.28.0.2-0' listening on '127.0.0.1:8000'\n",
-      "Shuffle Map:   0%|          | 0/1 [00:00<?, ?it/s]\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO:     Started server process [4043]\n",
-      "Shuffle Map: 100%|██████████| 1/1 [00:01<00:00,  1.61s/it]\n",
-      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00,  7.16it/s]\n",
-      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.36s/it]\n",
-      "\u001b[2m\u001b[36m(ServeController pid=4011)\u001b[0m INFO 2022-05-25 22:30:48,663 controller 4011 deployment_state.py:1219 - Adding 2 replicas to deployment 'mnist_model'.\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,754 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 5.0ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,771 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 15.8ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,777 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 3.1ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,788 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 9.0ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,794 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 3.5ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,803 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.0ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,808 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.5ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,817 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.2ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,822 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:52,770 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 11.5ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:52,787 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 6.1ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:52,802 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 4.8ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:52,815 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 4.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:52,752 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:52,776 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:52,793 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:52,807 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:52,821 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,848 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 24.9ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,853 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.6ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,869 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 13.4ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:52,847 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 8.4ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:52,867 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 6.6ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:52,852 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,984 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 3.5ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:52,995 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 9.0ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:53,001 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 3.4ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:53,011 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 8.1ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:53,016 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.7ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:53,025 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 7.4ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:53,030 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 307 2.5ms\n",
-      "\u001b[2m\u001b[36m(HTTPProxyActor pid=4043)\u001b[0m INFO 2022-05-25 22:30:53,045 http_proxy 172.28.0.2 http_proxy.py:320 - POST /mnist_predict 200 11.9ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:52,993 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 5.9ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:53,010 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 5.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:53,024 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 4.9ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4199)\u001b[0m INFO 2022-05-25 22:30:53,043 mnist_model mnist_model#kzOVuE replica.py:483 - HANDLE __call__ OK 4.9ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:52,982 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:52,999 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:53,015 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.2ms\n",
-      "\u001b[2m\u001b[36m(mnist_model pid=4200)\u001b[0m INFO 2022-05-25 22:30:53,029 mnist_model mnist_model#QFllkk replica.py:483 - HANDLE __call__ OK 0.3ms\n",
-      "\u001b[2m\u001b[36m(ServeController pid=4011)\u001b[0m INFO 2022-05-25 22:30:53,125 controller 4011 deployment_state.py:1243 - Removing 2 replicas from deployment 'mnist_model'.\n"
+      "Shuffle Map: 100%|██████████| 1/1 [00:00<00:00,  6.01it/s]\n",
+      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00,  6.26it/s]\n",
+      "Map Progress (1 actors 0 pending): 100%|██████████| 1/1 [00:01<00:00,  1.17s/it]\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:52:32,498 controller 39625 deployment_state.py:1240 - Stopping 1 replicas of deployment 'mnist_model' with outdated versions.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:52:34,634 controller 39625 deployment_state.py:1281 - Adding 1 replicas to deployment 'mnist_model'.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:52:36,956 controller 39625 deployment_state.py:1240 - Stopping 1 replicas of deployment 'mnist_model' with outdated versions.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:52:39,078 controller 39625 deployment_state.py:1281 - Adding 1 replicas to deployment 'mnist_model'.\n",
+      "\u001b[2m\u001b[36m(ServeController pid=39625)\u001b[0m INFO 2022-07-20 21:53:31,642 controller 39625 deployment_state.py:1304 - Removing 2 replicas from deployment 'mnist_model'.\n"
      ]
     }
    ],
@@ -1258,7 +1081,7 @@
     "# Number of data parallel workers to use for training.\n",
     "num_workers = 1\n",
     "# Whether to use GPU or not.\n",
-    "use_gpu = True\n",
+    "use_gpu = False\n",
     "\n",
     "permuted_mnist = PermutedMNISTStream(n_tasks=n_tasks)\n",
     "train_stream = permuted_mnist.generate_train_stream()\n",
@@ -1352,7 +1175,7 @@
     {
      "data": {
       "text/plain": [
-       "[0.946, 0.9261, 0.9001333333333333]"
+       "[0.3767, 0.36795, 0.3590333333333333]"
       ]
      },
      "execution_count": 11,
@@ -1388,7 +1211,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 12,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -1401,26 +1224,11 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "Map Progress (2 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.93s/it]\n",
-      "Map Progress (2 actors 1 pending): 100%|██████████| 1/1 [00:03<00:00,  3.11s/it]\n",
-      "Map Progress:   0%|          | 0/1 [00:00<?, ?it/s]"
-     ]
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\u001b[2m\u001b[1m\u001b[36m(scheduler +8m58s)\u001b[0m Tip: use `ray status` to view detailed cluster status. To disable these messages, set RAY_SCHEDULER_EVENTS=0.\n",
-      "\u001b[2m\u001b[1m\u001b[33m(scheduler +8m58s)\u001b[0m Warning: The following resource request cannot be scheduled right now: {'CPU': 1.0}. This is likely due to all cluster resources being claimed by actors. Consider creating fewer actors or adding more nodes to this Ray cluster.\n"
-     ]
-    },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "Map Progress (2 actors 1 pending): 100%|██████████| 1/1 [00:03<00:00,  3.06s/it]\n",
-      "Shuffle Map: 100%|██████████| 3/3 [00:04<00:00,  1.64s/it]\n",
-      "Shuffle Reduce: 100%|██████████| 3/3 [00:02<00:00,  1.07it/s]\n"
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.33s/it]\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.32s/it]\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.31s/it]\n",
+      "Shuffle Map: 100%|██████████| 3/3 [00:01<00:00,  2.55it/s]\n",
+      "Shuffle Reduce: 100%|██████████| 3/3 [00:01<00:00,  2.55it/s]\n"
      ]
     }
    ],
@@ -1448,7 +1256,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 13,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/",
@@ -1458,15 +1266,22 @@
     "outputId": "653b4dfc-ed47-4307-fa84-e4c4ea3ec354"
    },
    "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "2022-07-20 21:53:44,223\tWARNING base_trainer.py:167 -- When passing `datasets` to a Trainer, it is recommended to reserve at least 20% of node CPUs for Dataset execution by setting `_max_cpu_fraction_per_node = 0.8` in the Trainer `scaling_config`. Not doing so can lead to resource contention or hangs. See https://docs.ray.io/en/master/data/key-concepts.html#example-datasets-in-tune for more info.\n"
+     ]
+    },
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-05-18 23:52:49 (running for 00:03:27.40)<br>Memory usage on this node: 7.0/12.7 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/2 CPUs, 0/1 GPUs, 0.0/7.34 GiB heap, 0.0/3.67 GiB objects (0.0/1.0 accelerator_type:T4)<br>Result logdir: /root/ray_results/TorchTrainer_2022-05-18_23-49-22<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-07-20 21:55:10 (running for 00:01:25.89)<br>Memory usage on this node: 34.4/64.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/28.14 GiB heap, 0.0/2.0 GiB objects<br>Result logdir: /Users/jiaodong/ray_results/TorchTrainer_2022-07-20_21-53-44<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name              </th><th>status    </th><th>loc            </th></tr>\n",
+       "<tr><th>Trial name              </th><th>status    </th><th>loc            </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">  loss</th><th style=\"text-align: right;\">  _timestamp</th><th style=\"text-align: right;\">  _time_this_iter_s</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>TorchTrainer_24496_00000</td><td>TERMINATED</td><td>172.28.0.2:4630</td></tr>\n",
+       "<tr><td>TorchTrainer_1923b_00000</td><td>TERMINATED</td><td>127.0.0.1:40228</td><td style=\"text-align: right;\">     4</td><td style=\"text-align: right;\">         82.7285</td><td style=\"text-align: right;\">2328.8</td><td style=\"text-align: right;\">  1658379309</td><td style=\"text-align: right;\">            17.0239</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -1481,85 +1296,59 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(_map_block_nosplit pid=4666)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(_map_block_nosplit pid=4666)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m 2022-05-18 23:50:06,950\tINFO torch.py:347 -- Setting up process group for: env:// [rank=0, world_size=1]\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m 2022-05-18 23:50:07,011\tINFO torch.py:98 -- Moving model to device: cuda:0\n"
-     ]
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 2.373475, epoch: 0, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 1.699985, epoch: 0, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 1.636039, epoch: 0, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 1.334987, epoch: 0, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 1.152312, epoch: 0, iteration: 2000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.998297, epoch: 0, iteration: 2500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 1.434949, epoch: 0, iteration: 3000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.971171, epoch: 0, iteration: 3500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.796480, epoch: 0, iteration: 4000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.802282, epoch: 0, iteration: 4500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.731363, epoch: 0, iteration: 5000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.847772, epoch: 0, iteration: 5500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.879676, epoch: 1, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.564319, epoch: 1, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.714444, epoch: 1, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.565163, epoch: 1, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.739525, epoch: 1, iteration: 2000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.510878, epoch: 1, iteration: 2500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.814798, epoch: 1, iteration: 3000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.473765, epoch: 1, iteration: 3500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.557866, epoch: 1, iteration: 4000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.674371, epoch: 1, iteration: 4500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.532800, epoch: 1, iteration: 5000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.832442, epoch: 1, iteration: 5500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.557547, epoch: 2, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.355255, epoch: 2, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.426749, epoch: 2, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.484543, epoch: 2, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.360856, epoch: 2, iteration: 2000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.444718, epoch: 2, iteration: 2500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.596777, epoch: 2, iteration: 3000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.289816, epoch: 2, iteration: 3500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.407941, epoch: 2, iteration: 4000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.438239, epoch: 2, iteration: 4500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.379983, epoch: 2, iteration: 5000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.527786, epoch: 2, iteration: 5500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.598584, epoch: 3, iteration: 0\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.355202, epoch: 3, iteration: 500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.392683, epoch: 3, iteration: 1000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.415264, epoch: 3, iteration: 1500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.417230, epoch: 3, iteration: 2000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.289974, epoch: 3, iteration: 2500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.648514, epoch: 3, iteration: 3000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.369468, epoch: 3, iteration: 3500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.378548, epoch: 3, iteration: 4000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.392761, epoch: 3, iteration: 4500\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.555575, epoch: 3, iteration: 5000\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=4709)\u001b[0m loss: 0.394487, epoch: 3, iteration: 5500\n"
-     ]
-    },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "2022-05-18 23:52:49,915\tERROR checkpoint_manager.py:193 -- Result dict has no key: training_iteration. checkpoint_score_attr must be set to a key of the result dict. Valid keys are ['trial_id', 'experiment_id', 'date', 'timestamp', 'pid', 'hostname', 'node_ip', 'config', 'done']\n"
+      "\u001b[2m\u001b[36m(TorchTrainer pid=40228)\u001b[0m 2022-07-20 21:53:47,328\tWARNING base_trainer.py:167 -- When passing `datasets` to a Trainer, it is recommended to reserve at least 20% of node CPUs for Dataset execution by setting `_max_cpu_fraction_per_node = 0.8` in the Trainer `scaling_config`. Not doing so can lead to resource contention or hangs. See https://docs.ray.io/en/master/data/key-concepts.html#example-datasets-in-tune for more info.\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Trial TorchTrainer_24496_00000 completed. Last result: \n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 2.305423, epoch: 0, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 1.935424, epoch: 0, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 1.174222, epoch: 0, iteration: 5000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.776577, epoch: 0, iteration: 5500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.674814, epoch: 1, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.699747, epoch: 1, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.795673, epoch: 1, iteration: 5000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.651217, epoch: 1, iteration: 5500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.743072, epoch: 2, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.745054, epoch: 2, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.639829, epoch: 2, iteration: 5000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.682482, epoch: 2, iteration: 5500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.553197, epoch: 3, iteration: 0\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.471037, epoch: 3, iteration: 500\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.538055, epoch: 3, iteration: 5000\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=40276)\u001b[0m loss: 0.534079, epoch: 3, iteration: 5500\n",
+      "Result for TorchTrainer_1923b_00000:\n",
+      "  _time_this_iter_s: 17.023871898651123\n",
+      "  _timestamp: 1658379309\n",
+      "  _training_iteration: 4\n",
+      "  date: 2022-07-20_21-55-10\n",
+      "  done: true\n",
+      "  experiment_id: d304983bfe3f4e269118f8618aa9b02f\n",
+      "  experiment_tag: '0'\n",
+      "  hostname: Jiaos-MacBook-Pro-16-inch-2019\n",
+      "  iterations_since_restore: 4\n",
+      "  loss: 2328.8038033917546\n",
+      "  node_ip: 127.0.0.1\n",
+      "  pid: 40228\n",
+      "  should_checkpoint: true\n",
+      "  time_since_restore: 82.72845268249512\n",
+      "  time_this_iter_s: 17.024354696273804\n",
+      "  time_total_s: 82.72845268249512\n",
+      "  timestamp: 1658379310\n",
+      "  timesteps_since_restore: 0\n",
+      "  training_iteration: 4\n",
+      "  trial_id: 1923b_00000\n",
+      "  warmup_time: 0.004433870315551758\n",
+      "  \n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-18 23:52:50,042\tINFO tune.py:753 -- Total run time: 207.53 seconds (207.39 seconds for the tuning loop).\n"
+      "2022-07-20 21:55:10,233\tINFO tune.py:738 -- Total run time: 86.00 seconds (85.88 seconds for the tuning loop).\n"
      ]
     }
    ],
@@ -1593,7 +1382,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 14,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -1606,13 +1395,12 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "Map Progress (1 actors 1 pending):   0%|          | 0/3 [00:01<?, ?it/s]\u001b[2m\u001b[36m(BlockWorker pid=4840)\u001b[0m /usr/local/lib/python3.7/dist-packages/torchvision/transforms/functional.py:133: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:178.)\n",
-      "\u001b[2m\u001b[36m(BlockWorker pid=4840)\u001b[0m   img = torch.from_numpy(pic.transpose((2, 0, 1))).contiguous()\n",
-      "Map Progress (2 actors 1 pending): 100%|██████████| 3/3 [00:06<00:00,  2.25s/it]\n",
-      "Map Progress: 100%|██████████| 3/3 [00:01<00:00,  1.51it/s]\n",
-      "Map Progress: 100%|██████████| 3/3 [00:01<00:00,  1.94it/s]\n",
-      "Shuffle Map: 100%|██████████| 3/3 [00:00<00:00,  5.53it/s]\n",
-      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00, 65.42it/s]\n"
+      "Map Progress (1 actors 1 pending):   0%|          | 0/3 [00:01<?, ?it/s]\u001b[2m\u001b[36m(BlockWorker pid=40400)\u001b[0m /Users/jiaodong/anaconda3/envs/ray3.7/lib/python3.7/site-packages/torchvision/transforms/functional.py:150: UserWarning: The given NumPy array is not writable, and PyTorch does not support non-writable tensors. This means writing to this tensor will result in undefined behavior. You may want to copy the array to protect its data or make it writable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  /Users/runner/work/pytorch/pytorch/pytorch/torch/csrc/utils/tensor_numpy.cpp:178.)\n",
+      "Map Progress (2 actors 1 pending): 100%|██████████| 3/3 [00:04<00:00,  1.62s/it]\n",
+      "Map_Batches: 100%|██████████| 3/3 [00:00<00:00, 63.30it/s]\n",
+      "Map_Batches: 100%|██████████| 3/3 [00:00<00:00, 129.65it/s]\n",
+      "Shuffle Map: 100%|██████████| 3/3 [00:00<00:00, 312.18it/s]\n",
+      "Shuffle Reduce: 100%|██████████| 1/1 [00:00<00:00, 149.25it/s]\n"
      ]
     }
    ],
@@ -1634,7 +1422,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 15,
    "metadata": {
     "colab": {
      "base_uri": "https://localhost:8080/"
@@ -1647,8 +1435,8 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Fully trained model accuracy:  0.9468\n",
-      "Incrementally trained model accuracy:  0.9207666666666666\n"
+      "Fully trained model accuracy:  0.38016666666666665\n",
+      "Incrementally trained model accuracy:  0.3590333333333333\n"
      ]
     }
    ],
@@ -1671,15 +1459,6 @@
     "\n",
     "\n"
    ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {
-    "id": "2GdLZD4od3oI"
-   },
-   "outputs": [],
-   "source": []
   }
  ],
  "metadata": {
@@ -1690,7 +1469,7 @@
    "provenance": []
   },
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "Python 3.7.10 ('ray3.7')",
    "language": "python",
    "name": "python3"
   },
@@ -1704,7 +1483,12 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.8.6"
+   "version": "3.7.10"
+  },
+  "vscode": {
+   "interpreter": {
+    "hash": "99d89bfe98f3aa2d7facda0d08d31ff2a0af9559e5330d719288ce64a1966273"
+   }
   }
  },
  "nbformat": 4,
diff --git a/python/ray/data/extensions/__init__.py b/python/ray/data/extensions/__init__.py
index a9ae87faeb02..70b4daedd328 100644
--- a/python/ray/data/extensions/__init__.py
+++ b/python/ray/data/extensions/__init__.py
@@ -1,6 +1,7 @@
 from ray.data.extensions.tensor_extension import (
     TensorDtype,
     TensorArray,
+    TensorArrayElement,
     ArrowTensorType,
     ArrowTensorArray,
 )
@@ -9,6 +10,7 @@
     # Tensor array extension.
     "TensorDtype",
     "TensorArray",
+    "TensorArrayElement",
     "ArrowTensorType",
     "ArrowTensorArray",
 ]
diff --git a/python/ray/data/extensions/tensor_extension.py b/python/ray/data/extensions/tensor_extension.py
index 0fa577250a83..96b868bb47f5 100644
--- a/python/ray/data/extensions/tensor_extension.py
+++ b/python/ray/data/extensions/tensor_extension.py
@@ -1,6 +1,7 @@
 from ray.air.util.tensor_extensions.pandas import (  # noqa: F401
     TensorDtype,
     TensorArray,
+    TensorArrayElement,
 )
 from ray.air.util.tensor_extensions.arrow import (  # noqa: F401
     ArrowTensorType,
diff --git a/python/ray/serve/air_integrations.py b/python/ray/serve/air_integrations.py
index d3868763d683..ddf87c268c0a 100644
--- a/python/ray/serve/air_integrations.py
+++ b/python/ray/serve/air_integrations.py
@@ -45,6 +45,23 @@ def _load_predictor_cls(
     return predictor_cls
 
 
+def _unpack_tensorarray_from_pandas(output_df: "pd.DataFrame") -> "pd.DataFrame":
+    """Convert TensorArray columns of a predictor's output to plain values.
+
+    In dl_predictor.py we return a pd.DataFrame that could have multiple
+    columns whose values are TensorArrays. Each such column is replaced,
+    in place, by a list of its per-row numpy values so tensors of any
+    rank fit in one column and the output can be sent as an http response.
+    """
+    from ray.data.extensions import TensorArray, TensorArrayElement
+
+    for col in output_df:
+        if isinstance(output_df[col].values, (TensorArray, TensorArrayElement)):
+            output_df[col] = list(output_df[col].to_numpy())
+
+    return output_df
+
+
 class BatchingManager:
     """A collection of utilities for batching and splitting data."""
 
@@ -91,6 +108,9 @@ def split_dataframe(
                 f"The output dataframe should have length divisible by {batch_size}, "
                 f"but Serve got length {len(output_df)}."
             )
+
+        output_df = _unpack_tensorarray_from_pandas(output_df)
+
         return [df.reset_index(drop=True) for df in np.split(output_df, batch_size)]
 
     @staticmethod
@@ -200,6 +220,8 @@ async def predict_impl(inp: Union[np.ndarray, "pd.DataFrame"]):
                 out = self.model.predict(inp, **predict_kwargs)
                 if isinstance(out, ray.ObjectRef):
                     out = await out
+                elif pd is not None and isinstance(out, pd.DataFrame):
+                    out = _unpack_tensorarray_from_pandas(out)
                 return out
 
         else:
diff --git a/python/ray/serve/tests/test_air_integrations.py b/python/ray/serve/tests/test_air_integrations.py
index 26bd6f8a39c9..b0a222a69879 100644
--- a/python/ray/serve/tests/test_air_integrations.py
+++ b/python/ray/serve/tests/test_air_integrations.py
@@ -16,6 +16,7 @@
 from ray.serve.deployment_graph_build import build
 from ray.serve.http_adapters import json_to_ndarray
 from ray.train.predictor import DataBatchType, Predictor
+from ray.data.extensions import TensorArray
 
 
 class TestBatchingFunctionFunctions:
@@ -73,6 +74,25 @@ def test_dataframe(self):
         for i, j in zip(unpacked_list, list_of_dfs):
             assert i.equals(j)
 
+    def test_dataframe_with_tensorarray(self):
+        """TensorArray columns come back from split_dataframe as plain values."""
+        raw = {"a": [1, 2, 3, 4], "b": [5, 6, 7, 8]}
+        # Same data twice: wrapped in TensorArray for the input, and left as
+        # plain lists for the expected result.
+        tensor_df = pd.DataFrame(
+            {name: TensorArray(values) for name, values in raw.items()}
+        )
+        expected_df = pd.DataFrame(raw)
+
+        # A batch size of 1 must yield exactly one frame holding every row.
+        chunks = BatchingManager.split_dataframe(tensor_df, 1)
+        assert len(chunks) == 1
+
+        # Compare column by column against the plain-valued frame.
+        only_chunk = chunks[0]
+        for name in raw:
+            assert only_chunk[name].equals(expected_df[name])
+
 
 class AdderPredictor(Predictor):
     def __init__(self, increment: int, do_double: bool) -> None:

Python version:	3.7.10
Ray version:	3.0.0.dev0
Dashboard:	http://127.0.0.1:8266
	pickup_community_area	trip_start_month	trip_start_hour	trip_start_day	trip_start_timestamp	trip_miles	dropoff_census_tract	payment_type	company	trip_seconds	dropoff_community_area	is_big_tip
0	NaN	5	19	6	1400269500	0.0	NaN	Credit Card	Chicago Elite Cab Corp. (Chicago Carriag	0.0	NaN	False
1	NaN	3	19	5	1362683700	0.0	NaN	Unknown	Chicago Elite Cab Corp.	300.0	NaN	False
2	60.0	10	2	3	1380593700	12.6	NaN	Cash	Taxi Affiliation Services	1380.0	NaN	False
3	10.0	10	1	2	1382319000	0.0	NaN	Cash	Taxi Affiliation Services	180.0	NaN	False
4	14.0	5	7	5	1369897200	0.0	NaN	Cash	Dispatch Taxi Affiliation	1080.0	NaN	False
Trial name	status	loc
Trial name	status	loc	iter	total time (s)	loss	_timestamp	_time_this_iter_s
TorchTrainer_a8585_00000	TERMINATED	172.28.0.2:2126
TorchTrainer_53c58_00000	TERMINATED	127.0.0.1:39548	4	36.4582	824.229	1658378932	6.46339