From 1931cf1df75be2b9c9e9ed821f3b6d50687c3227 Mon Sep 17 00:00:00 2001
From: Antoni Baum <antoni.baum@protonmail.com>
Date: Wed, 22 Jun 2022 17:33:50 +0000
Subject: [PATCH 1/2] [AIR] Remove unnecessary pandas from examples

---
 .../ray-air/doc_code/air_key_concepts.py      |   6 +-
 doc/source/ray-air/doc_code/preprocessors.py  |  22 +-
 doc/source/ray-air/doc_code/tf_starter.py     |   4 +-
 .../ray-air/doc_code/xgboost_starter.py       |  14 +-
 ...ert_existing_pytorch_code_to_ray_air.ipynb | 883 ++++++++++++------
 .../huggingface_text_classification.ipynb     |   3 +-
 .../ray-air/examples/lightgbm_example.ipynb   | 389 ++++----
 .../ray-air/examples/sklearn_example.ipynb    | 277 +++---
 .../ray-air/examples/upload_to_comet_ml.ipynb |  10 +-
 .../ray-air/examples/upload_to_wandb.ipynb    |  10 +-
 .../ray-air/examples/xgboost_example.ipynb    | 351 +++----
 ...ingface_basic_language_modeling_example.py |   3 +-
 .../tf/tensorflow_linear_dataset_example.py   |   5 +-
 13 files changed, 1119 insertions(+), 858 deletions(-)

diff --git a/doc/source/ray-air/doc_code/air_key_concepts.py b/doc/source/ray-air/doc_code/air_key_concepts.py
index 6d4e29798432..42727433751b 100644
--- a/doc/source/ray-air/doc_code/air_key_concepts.py
+++ b/doc/source/ray-air/doc_code/air_key_concepts.py
@@ -75,10 +75,8 @@
 batch_predictor = BatchPredictor.from_checkpoint(result.checkpoint, XGBoostPredictor)
 
 # Bulk batch prediction.
-predicted_labels = (
-    batch_predictor.predict(test_dataset)
-    .map_batches(lambda df: (df > 0.5).astype(int), batch_format="pandas")
-    .to_pandas(limit=float("inf"))
+predicted_labels = batch_predictor.predict(test_dataset).map_batches(
+    lambda df: (df > 0.5).astype(int), batch_format="pandas"
 )
 
 # Pipelined batch prediction: instead of processing the data in bulk, process it
diff --git a/doc/source/ray-air/doc_code/preprocessors.py b/doc/source/ray-air/doc_code/preprocessors.py
index d5eb3d86b164..1c19f08d2b8f 100644
--- a/doc/source/ray-air/doc_code/preprocessors.py
+++ b/doc/source/ray-air/doc_code/preprocessors.py
@@ -89,18 +89,16 @@
 
 batch_predictor = BatchPredictor.from_checkpoint(checkpoint, XGBoostPredictor)
 predicted_labels = batch_predictor.predict(test_dataset)
-print(predicted_labels.to_pandas())
-#    predictions
-# 0     0.098437
-# 1     5.604667
-# 2    11.405312
-# 3    15.684700
-# 4    23.990948
-# 5    29.900211
-# 6    34.599442
-# 7    40.696899
-# 8    45.681076
-# 9    50.290031
+predicted_labels.show()
+# {'predictions': 0.09843720495700836}
+# {'predictions': 5.604666709899902}
+# {'predictions': 11.405311584472656}
+# {'predictions': 15.684700012207031}
+# {'predictions': 23.990947723388672}
+# {'predictions': 29.900211334228516}
+# {'predictions': 34.59944152832031}
+# {'predictions': 40.6968994140625}
+# {'predictions': 45.68107604980469}
 # __predictor_end__
 
 
diff --git a/doc/source/ray-air/doc_code/tf_starter.py b/doc/source/ray-air/doc_code/tf_starter.py
index a121bedae7f5..360503294fdc 100644
--- a/doc/source/ray-air/doc_code/tf_starter.py
+++ b/doc/source/ray-air/doc_code/tf_starter.py
@@ -105,7 +105,7 @@ def train_func(config: dict):
 
 predictions = batch_predictor.predict(prediction_dataset, dtype=tf.float32)
 
-pandas_predictions = predictions.to_pandas(float("inf"))
+print("PREDICTIONS")
+predictions.show()
 
-print(f"PREDICTIONS\n{pandas_predictions}")
 # __air_tf_batchpred_end__
diff --git a/doc/source/ray-air/doc_code/xgboost_starter.py b/doc/source/ray-air/doc_code/xgboost_starter.py
index 94616fe77582..f2e7a3793d95 100644
--- a/doc/source/ray-air/doc_code/xgboost_starter.py
+++ b/doc/source/ray-air/doc_code/xgboost_starter.py
@@ -59,17 +59,13 @@
 
 batch_predictor = BatchPredictor.from_checkpoint(result.checkpoint, XGBoostPredictor)
 
-predicted_labels = (
-    batch_predictor.predict(test_dataset)
-    .map_batches(lambda df: (df > 0.5).astype(int), batch_format="pandas")
-    .to_pandas(limit=float("inf"))
+predicted_labels = batch_predictor.predict(test_dataset).map_batches(
+    lambda df: (df > 0.5).astype(int), batch_format="pandas"
 )
 print("PREDICTED LABELS")
-print(f"{predicted_labels}")
+predicted_labels.show()
 
-shap_values = batch_predictor.predict(test_dataset, pred_contribs=True).to_pandas(
-    limit=float("inf")
-)
+shap_values = batch_predictor.predict(test_dataset, pred_contribs=True)
 print("SHAP VALUES")
-print(f"{shap_values}")
+shap_values.show()
 # __air_xgb_batchpred_end__
diff --git a/doc/source/ray-air/examples/convert_existing_pytorch_code_to_ray_air.ipynb b/doc/source/ray-air/examples/convert_existing_pytorch_code_to_ray_air.ipynb
index 6e0379973ff3..a94a9e4cfc81 100644
--- a/doc/source/ray-air/examples/convert_existing_pytorch_code_to_ray_air.ipynb
+++ b/doc/source/ray-air/examples/convert_existing_pytorch_code_to_ray_air.ipynb
@@ -73,11 +73,105 @@
    "metadata": {},
    "outputs": [
     {
-     "name": "stderr",
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz\n",
+      "Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "763ad47190b1461285dc3ea3a8177e6f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/26421880 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
      "output_type": "stream",
      "text": [
-      "/Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/torchvision/datasets/mnist.py:498: UserWarning: The given NumPy array is not writeable, and PyTorch does not support non-writeable tensors. This means you can write to the underlying (supposedly non-writeable) NumPy array using the tensor. You may want to copy the array to protect its data or make it writeable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:180.)\n",
-      "  return torch.from_numpy(parsed.astype(m[2], copy=False)).view(*s)\n"
+      "Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw\n",
+      "\n",
+      "Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz\n",
+      "Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ab72b933d81942d9b8d2b8fc11f63120",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/29515 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw\n",
+      "\n",
+      "Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz\n",
+      "Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "06e73159e75d4aa2ac7f0f1ed37dc1e1",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/4422102 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw\n",
+      "\n",
+      "Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz\n",
+      "Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "744109b83b7f47628a798a69f2b54d72",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/5148 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw\n",
+      "\n"
      ]
     }
    ],
@@ -286,78 +380,78 @@
      "text": [
       "Epoch 1\n",
       "-------------------------------\n",
-      "loss: 2.304186  [    0/60000]\n",
-      "loss: 2.289454  [ 6400/60000]\n",
-      "loss: 2.275760  [12800/60000]\n",
-      "loss: 2.270670  [19200/60000]\n",
-      "loss: 2.240363  [25600/60000]\n",
-      "loss: 2.226019  [32000/60000]\n",
-      "loss: 2.230945  [38400/60000]\n",
-      "loss: 2.197411  [44800/60000]\n",
-      "loss: 2.197602  [51200/60000]\n",
-      "loss: 2.160038  [57600/60000]\n",
+      "loss: 2.310824  [    0/60000]\n",
+      "loss: 2.294673  [ 6400/60000]\n",
+      "loss: 2.279552  [12800/60000]\n",
+      "loss: 2.271212  [19200/60000]\n",
+      "loss: 2.253037  [25600/60000]\n",
+      "loss: 2.237454  [32000/60000]\n",
+      "loss: 2.229266  [38400/60000]\n",
+      "loss: 2.201499  [44800/60000]\n",
+      "loss: 2.204318  [51200/60000]\n",
+      "loss: 2.165509  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 43.4%, Avg loss: 2.156346 \n",
+      " Accuracy: 53.3%, Avg loss: 2.165069 \n",
       "\n",
       "Epoch 2\n",
       "-------------------------------\n",
-      "loss: 2.171642  [    0/60000]\n",
-      "loss: 2.156236  [ 6400/60000]\n",
-      "loss: 2.107473  [12800/60000]\n",
-      "loss: 2.118233  [19200/60000]\n",
-      "loss: 2.052204  [25600/60000]\n",
-      "loss: 2.006639  [32000/60000]\n",
-      "loss: 2.030226  [38400/60000]\n",
-      "loss: 1.953917  [44800/60000]\n",
-      "loss: 1.964219  [51200/60000]\n",
-      "loss: 1.873772  [57600/60000]\n",
+      "loss: 2.172770  [    0/60000]\n",
+      "loss: 2.162628  [ 6400/60000]\n",
+      "loss: 2.114871  [12800/60000]\n",
+      "loss: 2.129640  [19200/60000]\n",
+      "loss: 2.072733  [25600/60000]\n",
+      "loss: 2.029744  [32000/60000]\n",
+      "loss: 2.044677  [38400/60000]\n",
+      "loss: 1.968758  [44800/60000]\n",
+      "loss: 1.982601  [51200/60000]\n",
+      "loss: 1.903552  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 52.9%, Avg loss: 1.883439 \n",
+      " Accuracy: 56.8%, Avg loss: 1.906084 \n",
       "\n",
       "Epoch 3\n",
       "-------------------------------\n",
-      "loss: 1.929272  [    0/60000]\n",
-      "loss: 1.888294  [ 6400/60000]\n",
-      "loss: 1.783824  [12800/60000]\n",
-      "loss: 1.807983  [19200/60000]\n",
-      "loss: 1.694384  [25600/60000]\n",
-      "loss: 1.663575  [32000/60000]\n",
-      "loss: 1.671774  [38400/60000]\n",
-      "loss: 1.587723  [44800/60000]\n",
-      "loss: 1.612172  [51200/60000]\n",
-      "loss: 1.490934  [57600/60000]\n",
+      "loss: 1.929975  [    0/60000]\n",
+      "loss: 1.905118  [ 6400/60000]\n",
+      "loss: 1.797361  [12800/60000]\n",
+      "loss: 1.840994  [19200/60000]\n",
+      "loss: 1.721110  [25600/60000]\n",
+      "loss: 1.678175  [32000/60000]\n",
+      "loss: 1.691375  [38400/60000]\n",
+      "loss: 1.584185  [44800/60000]\n",
+      "loss: 1.619714  [51200/60000]\n",
+      "loss: 1.506852  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 59.6%, Avg loss: 1.520538 \n",
+      " Accuracy: 60.5%, Avg loss: 1.530285 \n",
       "\n",
       "Epoch 4\n",
       "-------------------------------\n",
-      "loss: 1.602018  [    0/60000]\n",
-      "loss: 1.556215  [ 6400/60000]\n",
-      "loss: 1.419982  [12800/60000]\n",
-      "loss: 1.469938  [19200/60000]\n",
-      "loss: 1.351850  [25600/60000]\n",
-      "loss: 1.363095  [32000/60000]\n",
-      "loss: 1.361990  [38400/60000]\n",
-      "loss: 1.299478  [44800/60000]\n",
-      "loss: 1.331679  [51200/60000]\n",
-      "loss: 1.225714  [57600/60000]\n",
+      "loss: 1.583245  [    0/60000]\n",
+      "loss: 1.556023  [ 6400/60000]\n",
+      "loss: 1.411425  [12800/60000]\n",
+      "loss: 1.488727  [19200/60000]\n",
+      "loss: 1.359579  [25600/60000]\n",
+      "loss: 1.360133  [32000/60000]\n",
+      "loss: 1.366381  [38400/60000]\n",
+      "loss: 1.279213  [44800/60000]\n",
+      "loss: 1.328040  [51200/60000]\n",
+      "loss: 1.223219  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 63.5%, Avg loss: 1.255372 \n",
+      " Accuracy: 62.9%, Avg loss: 1.254554 \n",
       "\n",
       "Epoch 5\n",
       "-------------------------------\n",
-      "loss: 1.341576  [    0/60000]\n",
-      "loss: 1.316398  [ 6400/60000]\n",
-      "loss: 1.161010  [12800/60000]\n",
-      "loss: 1.250706  [19200/60000]\n",
-      "loss: 1.122512  [25600/60000]\n",
-      "loss: 1.159244  [32000/60000]\n",
-      "loss: 1.169590  [38400/60000]\n",
-      "loss: 1.114988  [44800/60000]\n",
-      "loss: 1.154847  [51200/60000]\n",
-      "loss: 1.066008  [57600/60000]\n",
+      "loss: 1.319601  [    0/60000]\n",
+      "loss: 1.307626  [ 6400/60000]\n",
+      "loss: 1.148442  [12800/60000]\n",
+      "loss: 1.258462  [19200/60000]\n",
+      "loss: 1.127337  [25600/60000]\n",
+      "loss: 1.160929  [32000/60000]\n",
+      "loss: 1.174176  [38400/60000]\n",
+      "loss: 1.098028  [44800/60000]\n",
+      "loss: 1.149889  [51200/60000]\n",
+      "loss: 1.065084  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 64.9%, Avg loss: 1.089063 \n",
+      " Accuracy: 64.1%, Avg loss: 1.088535 \n",
       "\n",
       "Done!\n"
      ]
@@ -475,78 +569,78 @@
       ")\n",
       "Epoch 1\n",
       "-------------------------------\n",
-      "loss: 2.300660  [    0/60000]\n",
-      "loss: 2.296696  [ 6400/60000]\n",
-      "loss: 2.275931  [12800/60000]\n",
-      "loss: 2.269738  [19200/60000]\n",
-      "loss: 2.264045  [25600/60000]\n",
-      "loss: 2.234024  [32000/60000]\n",
-      "loss: 2.238547  [38400/60000]\n",
-      "loss: 2.209435  [44800/60000]\n",
-      "loss: 2.214618  [51200/60000]\n",
-      "loss: 2.185344  [57600/60000]\n",
+      "loss: 2.300413  [    0/60000]\n",
+      "loss: 2.286883  [ 6400/60000]\n",
+      "loss: 2.273655  [12800/60000]\n",
+      "loss: 2.268864  [19200/60000]\n",
+      "loss: 2.244969  [25600/60000]\n",
+      "loss: 2.216548  [32000/60000]\n",
+      "loss: 2.222040  [38400/60000]\n",
+      "loss: 2.182495  [44800/60000]\n",
+      "loss: 2.182766  [51200/60000]\n",
+      "loss: 2.156811  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 41.6%, Avg loss: 2.178503 \n",
+      " Accuracy: 50.6%, Avg loss: 2.145070 \n",
       "\n",
       "Epoch 2\n",
       "-------------------------------\n",
-      "loss: 2.183002  [    0/60000]\n",
-      "loss: 2.178075  [ 6400/60000]\n",
-      "loss: 2.126900  [12800/60000]\n",
-      "loss: 2.142223  [19200/60000]\n",
-      "loss: 2.095714  [25600/60000]\n",
-      "loss: 2.040030  [32000/60000]\n",
-      "loss: 2.066279  [38400/60000]\n",
-      "loss: 1.993092  [44800/60000]\n",
-      "loss: 2.015497  [51200/60000]\n",
-      "loss: 1.938319  [57600/60000]\n",
+      "loss: 2.150665  [    0/60000]\n",
+      "loss: 2.138080  [ 6400/60000]\n",
+      "loss: 2.086293  [12800/60000]\n",
+      "loss: 2.103044  [19200/60000]\n",
+      "loss: 2.041723  [25600/60000]\n",
+      "loss: 1.980555  [32000/60000]\n",
+      "loss: 2.000344  [38400/60000]\n",
+      "loss: 1.915977  [44800/60000]\n",
+      "loss: 1.930699  [51200/60000]\n",
+      "loss: 1.849836  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 53.5%, Avg loss: 1.936191 \n",
+      " Accuracy: 57.1%, Avg loss: 1.851586 \n",
       "\n",
       "Epoch 3\n",
       "-------------------------------\n",
-      "loss: 1.962513  [    0/60000]\n",
-      "loss: 1.940845  [ 6400/60000]\n",
-      "loss: 1.830932  [12800/60000]\n",
-      "loss: 1.868069  [19200/60000]\n",
-      "loss: 1.754753  [25600/60000]\n",
-      "loss: 1.703867  [32000/60000]\n",
-      "loss: 1.726961  [38400/60000]\n",
-      "loss: 1.626829  [44800/60000]\n",
-      "loss: 1.669507  [51200/60000]\n",
-      "loss: 1.556128  [57600/60000]\n",
+      "loss: 1.884133  [    0/60000]\n",
+      "loss: 1.847551  [ 6400/60000]\n",
+      "loss: 1.739998  [12800/60000]\n",
+      "loss: 1.781018  [19200/60000]\n",
+      "loss: 1.660957  [25600/60000]\n",
+      "loss: 1.619163  [32000/60000]\n",
+      "loss: 1.629720  [38400/60000]\n",
+      "loss: 1.535548  [44800/60000]\n",
+      "loss: 1.571056  [51200/60000]\n",
+      "loss: 1.458136  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 58.2%, Avg loss: 1.572178 \n",
+      " Accuracy: 60.9%, Avg loss: 1.483232 \n",
       "\n",
       "Epoch 4\n",
       "-------------------------------\n",
-      "loss: 1.636078  [    0/60000]\n",
-      "loss: 1.604536  [ 6400/60000]\n",
-      "loss: 1.457413  [12800/60000]\n",
-      "loss: 1.516031  [19200/60000]\n",
-      "loss: 1.394795  [25600/60000]\n",
-      "loss: 1.390730  [32000/60000]\n",
-      "loss: 1.400060  [38400/60000]\n",
-      "loss: 1.321162  [44800/60000]\n",
-      "loss: 1.366145  [51200/60000]\n",
-      "loss: 1.265664  [57600/60000]\n",
+      "loss: 1.549974  [    0/60000]\n",
+      "loss: 1.511189  [ 6400/60000]\n",
+      "loss: 1.374695  [12800/60000]\n",
+      "loss: 1.445348  [19200/60000]\n",
+      "loss: 1.323308  [25600/60000]\n",
+      "loss: 1.324354  [32000/60000]\n",
+      "loss: 1.328822  [38400/60000]\n",
+      "loss: 1.257330  [44800/60000]\n",
+      "loss: 1.298783  [51200/60000]\n",
+      "loss: 1.197863  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 62.5%, Avg loss: 1.288956 \n",
+      " Accuracy: 63.4%, Avg loss: 1.226258 \n",
       "\n",
       "Epoch 5\n",
       "-------------------------------\n",
-      "loss: 1.367953  [    0/60000]\n",
-      "loss: 1.350934  [ 6400/60000]\n",
-      "loss: 1.184691  [12800/60000]\n",
-      "loss: 1.275289  [19200/60000]\n",
-      "loss: 1.155229  [25600/60000]\n",
-      "loss: 1.179248  [32000/60000]\n",
-      "loss: 1.196911  [38400/60000]\n",
-      "loss: 1.129392  [44800/60000]\n",
-      "loss: 1.173347  [51200/60000]\n",
-      "loss: 1.095378  [57600/60000]\n",
+      "loss: 1.301627  [    0/60000]\n",
+      "loss: 1.279378  [ 6400/60000]\n",
+      "loss: 1.124873  [12800/60000]\n",
+      "loss: 1.230890  [19200/60000]\n",
+      "loss: 1.104782  [25600/60000]\n",
+      "loss: 1.130063  [32000/60000]\n",
+      "loss: 1.147206  [38400/60000]\n",
+      "loss: 1.083874  [44800/60000]\n",
+      "loss: 1.127730  [51200/60000]\n",
+      "loss: 1.044750  [57600/60000]\n",
       "Test Error: \n",
-      " Accuracy: 64.4%, Avg loss: 1.112272 \n",
+      " Accuracy: 64.6%, Avg loss: 1.066819 \n",
       "\n",
       "Done!\n"
      ]
@@ -716,7 +810,15 @@
    "execution_count": 14,
    "id": "3f79c731",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Package pickle5 becomes unnecessary in Python 3.8 and above. Its presence may confuse libraries including Ray. Please uninstall the package.\n"
+     ]
+    }
+   ],
    "source": [
     "import ray.train as train\n",
     "\n",
@@ -767,18 +869,18 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-06-14 13:02:53,006\tINFO services.py:1483 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8265\u001b[39m\u001b[22m\n"
+      "2022-06-22 16:28:31,525\tINFO services.py:1477 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8265\u001b[39m\u001b[22m\n"
      ]
     },
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-06-14 13:03:47 (running for 00:00:49.63)<br>Memory usage on this node: 10.3/16.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/3.63 GiB heap, 0.0/1.81 GiB objects<br>Result logdir: /Users/kai/ray_results/TorchTrainer_2022-06-14_13-02-55<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-06-22 16:29:30 (running for 00:00:56.32)<br>Memory usage on this node: 7.5/31.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/8 CPUs, 0/0 GPUs, 0.0/15.32 GiB heap, 0.0/7.66 GiB objects<br>Result logdir: /home/ubuntu/ray_results/TorchTrainer_2022-06-22_16-28-33<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name              </th><th>status    </th><th>loc           </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">   loss</th><th style=\"text-align: right;\">  _timestamp</th><th style=\"text-align: right;\">  _time_this_iter_s</th></tr>\n",
+       "<tr><th>Trial name              </th><th>status    </th><th>loc                  </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">  loss</th><th style=\"text-align: right;\">  _timestamp</th><th style=\"text-align: right;\">  _time_this_iter_s</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>TorchTrainer_8bcc7_00000</td><td>TERMINATED</td><td>127.0.0.1:7443</td><td style=\"text-align: right;\">     4</td><td style=\"text-align: right;\">         42.5615</td><td style=\"text-align: right;\">1.24926</td><td style=\"text-align: right;\">  1655204626</td><td style=\"text-align: right;\">            9.67353</td></tr>\n",
+       "<tr><td>TorchTrainer_5c84a_00000</td><td>TERMINATED</td><td>172.31.43.110:1481731</td><td style=\"text-align: right;\">     4</td><td style=\"text-align: right;\">         47.5635</td><td style=\"text-align: right;\">1.2631</td><td style=\"text-align: right;\">  1655915369</td><td style=\"text-align: right;\">            11.0948</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -793,126 +895,126 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-06-14 13:03:00,221\tWARNING worker.py:1737 -- Warning: The actor TrainTrainable is very large (52 MiB). Check that its definition is not implicitly capturing a large array or other object in scope. Tip: use ray.put() to put large objects in the Ray object store.\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7448)\u001b[0m 2022-06-14 13:03:06,880\tINFO config.py:71 -- Setting up process group for: env:// [rank=0, world_size=2]\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7449)\u001b[0m 2022-06-14 13:03:06,879\tINFO config.py:71 -- Setting up process group for: env:// [rank=1, world_size=2]\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7448)\u001b[0m 2022-06-14 13:03:08,303\tINFO train_loop_utils.py:293 -- Moving model to device: cpu\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7448)\u001b[0m 2022-06-14 13:03:08,303\tINFO train_loop_utils.py:331 -- Wrapping provided model in DDP.\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7449)\u001b[0m 2022-06-14 13:03:08,303\tINFO train_loop_utils.py:293 -- Moving model to device: cpu\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7449)\u001b[0m 2022-06-14 13:03:08,303\tINFO train_loop_utils.py:331 -- Wrapping provided model in DDP.\n"
+      "2022-06-22 16:28:38,581\tWARNING worker.py:1726 -- Warning: The actor TrainTrainable is very large (52 MiB). Check that its definition is not implicitly capturing a large array or other object in scope. Tip: use ray.put() to put large objects in the Ray object store.\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481763)\u001b[0m 2022-06-22 16:28:44,894\tINFO config.py:70 -- Setting up process group for: env:// [rank=0, world_size=2]\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481764)\u001b[0m 2022-06-22 16:28:44,891\tINFO config.py:70 -- Setting up process group for: env:// [rank=1, world_size=2]\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481763)\u001b[0m 2022-06-22 16:28:46,425\tINFO train_loop_utils.py:293 -- Moving model to device: cpu\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481763)\u001b[0m 2022-06-22 16:28:46,425\tINFO train_loop_utils.py:331 -- Wrapping provided model in DDP.\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481764)\u001b[0m 2022-06-22 16:28:46,425\tINFO train_loop_utils.py:293 -- Moving model to device: cpu\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481764)\u001b[0m 2022-06-22 16:28:46,425\tINFO train_loop_utils.py:331 -- Wrapping provided model in DDP.\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Result for TorchTrainer_8bcc7_00000:\n",
-      "  _time_this_iter_s: 9.377830982208252\n",
-      "  _timestamp: 1655204597\n",
+      "Result for TorchTrainer_5c84a_00000:\n",
+      "  _time_this_iter_s: 10.956670761108398\n",
+      "  _timestamp: 1655915337\n",
       "  _training_iteration: 1\n",
-      "  date: 2022-06-14_13-03-17\n",
+      "  date: 2022-06-22_16-28-57\n",
       "  done: false\n",
-      "  experiment_id: d262dbae86774c4fb809871401db393d\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  experiment_id: dd2810ff95f74b1a8390f918b6c122fe\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 1\n",
-      "  loss: 2.1573975238071124\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7443\n",
-      "  time_since_restore: 13.348651885986328\n",
-      "  time_this_iter_s: 13.348651885986328\n",
-      "  time_total_s: 13.348651885986328\n",
-      "  timestamp: 1655204597\n",
+      "  loss: 2.1705087840936748\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481731\n",
+      "  time_since_restore: 14.807097911834717\n",
+      "  time_this_iter_s: 14.807097911834717\n",
+      "  time_total_s: 14.807097911834717\n",
+      "  timestamp: 1655915337\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 1\n",
-      "  trial_id: 8bcc7_00000\n",
-      "  warmup_time: 0.0038008689880371094\n",
+      "  trial_id: 5c84a_00000\n",
+      "  warmup_time: 0.0042934417724609375\n",
       "  \n",
-      "Result for TorchTrainer_8bcc7_00000:\n",
-      "  _time_this_iter_s: 9.486207962036133\n",
-      "  _timestamp: 1655204607\n",
+      "Result for TorchTrainer_5c84a_00000:\n",
+      "  _time_this_iter_s: 10.683637142181396\n",
+      "  _timestamp: 1655915347\n",
       "  _training_iteration: 2\n",
-      "  date: 2022-06-14_13-03-27\n",
+      "  date: 2022-06-22_16-29-07\n",
       "  done: false\n",
-      "  experiment_id: d262dbae86774c4fb809871401db393d\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  experiment_id: dd2810ff95f74b1a8390f918b6c122fe\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 2\n",
-      "  loss: 1.88913657179304\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7443\n",
-      "  time_since_restore: 22.830953121185303\n",
-      "  time_this_iter_s: 9.482301235198975\n",
-      "  time_total_s: 22.830953121185303\n",
-      "  timestamp: 1655204607\n",
+      "  loss: 1.918477459318319\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481731\n",
+      "  time_since_restore: 25.498638153076172\n",
+      "  time_this_iter_s: 10.691540241241455\n",
+      "  time_total_s: 25.498638153076172\n",
+      "  timestamp: 1655915347\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 2\n",
-      "  trial_id: 8bcc7_00000\n",
-      "  warmup_time: 0.0038008689880371094\n",
+      "  trial_id: 5c84a_00000\n",
+      "  warmup_time: 0.0042934417724609375\n",
       "  \n",
-      "Result for TorchTrainer_8bcc7_00000:\n",
-      "  _time_this_iter_s: 10.05704402923584\n",
-      "  _timestamp: 1655204617\n",
+      "Result for TorchTrainer_5c84a_00000:\n",
+      "  _time_this_iter_s: 10.996578216552734\n",
+      "  _timestamp: 1655915358\n",
       "  _training_iteration: 3\n",
-      "  date: 2022-06-14_13-03-37\n",
+      "  date: 2022-06-22_16-29-18\n",
       "  done: false\n",
-      "  experiment_id: d262dbae86774c4fb809871401db393d\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  experiment_id: dd2810ff95f74b1a8390f918b6c122fe\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 3\n",
-      "  loss: 1.5208747804544533\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7443\n",
-      "  time_since_restore: 32.88802194595337\n",
-      "  time_this_iter_s: 10.057068824768066\n",
-      "  time_total_s: 32.88802194595337\n",
-      "  timestamp: 1655204617\n",
+      "  loss: 1.54556822397147\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481731\n",
+      "  time_since_restore: 36.48866558074951\n",
+      "  time_this_iter_s: 10.99002742767334\n",
+      "  time_total_s: 36.48866558074951\n",
+      "  timestamp: 1655915358\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 3\n",
-      "  trial_id: 8bcc7_00000\n",
-      "  warmup_time: 0.0038008689880371094\n",
+      "  trial_id: 5c84a_00000\n",
+      "  warmup_time: 0.0042934417724609375\n",
       "  \n",
-      "Result for TorchTrainer_8bcc7_00000:\n",
-      "  _time_this_iter_s: 9.673533201217651\n",
-      "  _timestamp: 1655204626\n",
+      "Result for TorchTrainer_5c84a_00000:\n",
+      "  _time_this_iter_s: 11.09483027458191\n",
+      "  _timestamp: 1655915369\n",
       "  _training_iteration: 4\n",
-      "  date: 2022-06-14_13-03-46\n",
+      "  date: 2022-06-22_16-29-29\n",
       "  done: false\n",
-      "  experiment_id: d262dbae86774c4fb809871401db393d\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  experiment_id: dd2810ff95f74b1a8390f918b6c122fe\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 4\n",
-      "  loss: 1.2492616913121217\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7443\n",
-      "  time_since_restore: 42.56152319908142\n",
-      "  time_this_iter_s: 9.673501253128052\n",
-      "  time_total_s: 42.56152319908142\n",
-      "  timestamp: 1655204626\n",
+      "  loss: 1.263096342800529\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481731\n",
+      "  time_since_restore: 47.56349587440491\n",
+      "  time_this_iter_s: 11.074830293655396\n",
+      "  time_total_s: 47.56349587440491\n",
+      "  timestamp: 1655915369\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 4\n",
-      "  trial_id: 8bcc7_00000\n",
-      "  warmup_time: 0.0038008689880371094\n",
+      "  trial_id: 5c84a_00000\n",
+      "  warmup_time: 0.0042934417724609375\n",
       "  \n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7449)\u001b[0m Done!\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7448)\u001b[0m Done!\n",
-      "Result for TorchTrainer_8bcc7_00000:\n",
-      "  _time_this_iter_s: 9.673533201217651\n",
-      "  _timestamp: 1655204626\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481763)\u001b[0m Done!\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481764)\u001b[0m Done!\n",
+      "Result for TorchTrainer_5c84a_00000:\n",
+      "  _time_this_iter_s: 11.09483027458191\n",
+      "  _timestamp: 1655915369\n",
       "  _training_iteration: 4\n",
-      "  date: 2022-06-14_13-03-46\n",
+      "  date: 2022-06-22_16-29-29\n",
       "  done: true\n",
-      "  experiment_id: d262dbae86774c4fb809871401db393d\n",
+      "  experiment_id: dd2810ff95f74b1a8390f918b6c122fe\n",
       "  experiment_tag: '0'\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 4\n",
-      "  loss: 1.2492616913121217\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7443\n",
-      "  time_since_restore: 42.56152319908142\n",
-      "  time_this_iter_s: 9.673501253128052\n",
-      "  time_total_s: 42.56152319908142\n",
-      "  timestamp: 1655204626\n",
+      "  loss: 1.263096342800529\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481731\n",
+      "  time_since_restore: 47.56349587440491\n",
+      "  time_this_iter_s: 11.074830293655396\n",
+      "  time_total_s: 47.56349587440491\n",
+      "  timestamp: 1655915369\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 4\n",
-      "  trial_id: 8bcc7_00000\n",
-      "  warmup_time: 0.0038008689880371094\n",
+      "  trial_id: 5c84a_00000\n",
+      "  warmup_time: 0.0042934417724609375\n",
       "  \n"
      ]
     },
@@ -920,14 +1022,14 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-06-14 13:03:47,154\tINFO tune.py:742 -- Total run time: 51.21 seconds (49.63 seconds for the tuning loop).\n"
+      "2022-06-22 16:29:31,024\tINFO tune.py:734 -- Total run time: 57.58 seconds (56.31 seconds for the tuning loop).\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Last result: {'loss': 1.2492616913121217, '_timestamp': 1655204626, '_time_this_iter_s': 9.673533201217651, '_training_iteration': 4, 'time_this_iter_s': 9.673501253128052, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 4, 'trial_id': '8bcc7_00000', 'experiment_id': 'd262dbae86774c4fb809871401db393d', 'date': '2022-06-14_13-03-46', 'timestamp': 1655204626, 'time_total_s': 42.56152319908142, 'pid': 7443, 'hostname': 'Kais-MacBook-Pro.fritz.box', 'node_ip': '127.0.0.1', 'config': {}, 'time_since_restore': 42.56152319908142, 'timesteps_since_restore': 0, 'iterations_since_restore': 4, 'warmup_time': 0.0038008689880371094, 'experiment_tag': '0'}\n"
+      "Last result: {'loss': 1.263096342800529, '_timestamp': 1655915369, '_time_this_iter_s': 11.09483027458191, '_training_iteration': 4, 'time_this_iter_s': 11.074830293655396, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 4, 'trial_id': '5c84a_00000', 'experiment_id': 'dd2810ff95f74b1a8390f918b6c122fe', 'date': '2022-06-22_16-29-29', 'timestamp': 1655915369, 'time_total_s': 47.56349587440491, 'pid': 1481731, 'hostname': 'ip-172-31-43-110', 'node_ip': '172.31.43.110', 'config': {}, 'time_since_restore': 47.56349587440491, 'timesteps_since_restore': 0, 'iterations_since_restore': 4, 'warmup_time': 0.0042934417724609375, 'experiment_tag': '0'}\n"
      ]
     }
    ],
@@ -1051,12 +1153,12 @@
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-06-14 13:04:34 (running for 00:00:47.20)<br>Memory usage on this node: 11.4/16.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/3.63 GiB heap, 0.0/1.81 GiB objects<br>Result logdir: /Users/kai/ray_results/TorchTrainer_2022-06-14_13-03-47<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-06-22 16:30:41 (running for 00:00:56.46)<br>Memory usage on this node: 7.2/31.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/8 CPUs, 0/0 GPUs, 0.0/15.32 GiB heap, 0.0/7.66 GiB objects<br>Result logdir: /home/ubuntu/ray_results/TorchTrainer_2022-06-22_16-29-44<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name              </th><th>status    </th><th>loc           </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">   loss</th><th style=\"text-align: right;\">  _timestamp</th><th style=\"text-align: right;\">  _time_this_iter_s</th></tr>\n",
+       "<tr><th>Trial name              </th><th>status    </th><th>loc                  </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">   loss</th><th style=\"text-align: right;\">  _timestamp</th><th style=\"text-align: right;\">  _time_this_iter_s</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>TorchTrainer_a9dda_00000</td><td>TERMINATED</td><td>127.0.0.1:7485</td><td style=\"text-align: right;\">     4</td><td style=\"text-align: right;\">         41.9863</td><td style=\"text-align: right;\">1.22261</td><td style=\"text-align: right;\">  1655204673</td><td style=\"text-align: right;\">            9.94109</td></tr>\n",
+       "<tr><td>TorchTrainer_86514_00000</td><td>TERMINATED</td><td>172.31.43.110:1481879</td><td style=\"text-align: right;\">     4</td><td style=\"text-align: right;\">         53.1038</td><td style=\"text-align: right;\">1.24844</td><td style=\"text-align: right;\">  1655915440</td><td style=\"text-align: right;\">            11.4238</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -1071,134 +1173,280 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7491)\u001b[0m 2022-06-14 13:03:54,234\tINFO config.py:71 -- Setting up process group for: env:// [rank=0, world_size=2]\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7492)\u001b[0m 2022-06-14 13:03:54,234\tINFO config.py:71 -- Setting up process group for: env:// [rank=1, world_size=2]\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7491)\u001b[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/torchvision/datasets/mnist.py:498: UserWarning: The given NumPy array is not writeable, and PyTorch does not support non-writeable tensors. This means you can write to the underlying (supposedly non-writeable) NumPy array using the tensor. You may want to copy the array to protect its data or make it writeable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:180.)\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7491)\u001b[0m   return torch.from_numpy(parsed.astype(m[2], copy=False)).view(*s)\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7491)\u001b[0m 2022-06-14 13:03:55,404\tINFO train_loop_utils.py:293 -- Moving model to device: cpu\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7491)\u001b[0m 2022-06-14 13:03:55,404\tINFO train_loop_utils.py:331 -- Wrapping provided model in DDP.\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7492)\u001b[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/torchvision/datasets/mnist.py:498: UserWarning: The given NumPy array is not writeable, and PyTorch does not support non-writeable tensors. This means you can write to the underlying (supposedly non-writeable) NumPy array using the tensor. You may want to copy the array to protect its data or make it writeable before converting it to a tensor. This type of warning will be suppressed for the rest of this program. (Triggered internally at  ../torch/csrc/utils/tensor_numpy.cpp:180.)\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7492)\u001b[0m   return torch.from_numpy(parsed.astype(m[2], copy=False)).view(*s)\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7492)\u001b[0m 2022-06-14 13:03:55,404\tINFO train_loop_utils.py:293 -- Moving model to device: cpu\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7492)\u001b[0m 2022-06-14 13:03:55,404\tINFO train_loop_utils.py:331 -- Wrapping provided model in DDP.\n"
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m 2022-06-22 16:29:50,060\tINFO config.py:70 -- Setting up process group for: env:// [rank=1, world_size=2]\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m 2022-06-22 16:29:50,039\tINFO config.py:70 -- Setting up process group for: env:// [rank=0, world_size=2]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "  0%|          | 0/26421880 [00:00<?, ?it/s]\n",
+      "  0%|          | 0/26421880 [00:00<?, ?it/s]\n",
+      "  0%|          | 41984/26421880 [00:00<01:12, 361943.13it/s]\n",
+      "  0%|          | 41984/26421880 [00:00<01:10, 375108.71it/s]\n",
+      "  0%|          | 96256/26421880 [00:00<00:57, 459571.31it/s]\n",
+      "  0%|          | 79872/26421880 [00:00<01:10, 376211.09it/s]\n",
+      "  1%|          | 205824/26421880 [00:00<00:35, 736411.92it/s]\n",
+      "  0%|          | 130048/26421880 [00:00<01:00, 431147.91it/s]\n",
+      "  2%|▏         | 427008/26421880 [00:00<00:20, 1299733.59it/s]\n",
+      "  1%|          | 274432/26421880 [00:00<00:31, 822829.39it/s]\n",
+      "  3%|▎         | 870400/26421880 [00:00<00:10, 2402951.16it/s]\n",
+      "  2%|▏         | 565248/26421880 [00:00<00:16, 1558525.69it/s]\n",
+      "  7%|▋         | 1754112/26421880 [00:00<00:05, 4545943.78it/s]\n",
+      "  4%|▍         | 1145856/26421880 [00:00<00:08, 2984121.04it/s]\n",
+      " 13%|█▎        | 3316736/26421880 [00:00<00:02, 8105757.73it/s]\n",
+      "  9%|▊         | 2288640/26421880 [00:00<00:04, 5702264.83it/s]\n",
+      " 19%|█▊        | 4894720/26421880 [00:00<00:02, 10492520.90it/s]\n",
+      " 15%|█▍        | 3875840/26421880 [00:00<00:02, 8912112.28it/s]\n",
+      " 24%|██▍       | 6440960/26421880 [00:00<00:01, 11998939.91it/s]\n",
+      " 20%|██        | 5402624/26421880 [00:00<00:01, 10824900.56it/s]\n",
+      " 30%|███       | 7987200/26421880 [00:01<00:01, 13030704.03it/s]\n",
+      " 27%|██▋       | 7032832/26421880 [00:01<00:01, 12501970.20it/s]\n",
+      " 36%|███▌      | 9534464/26421880 [00:01<00:01, 13735819.55it/s]\n",
+      " 33%|███▎      | 8593408/26421880 [00:01<00:01, 13437913.13it/s]\n",
+      " 42%|████▏     | 11080704/26421880 [00:01<00:01, 14207667.46it/s]\n",
+      " 38%|███▊      | 10128384/26421880 [00:01<00:01, 14011409.41it/s]\n",
+      " 48%|████▊     | 12626944/26421880 [00:01<00:00, 14542620.11it/s]\n",
+      " 44%|████▍     | 11660288/26421880 [00:01<00:01, 14405849.73it/s]\n",
+      " 54%|█████▎    | 14174208/26421880 [00:01<00:00, 14759412.47it/s]\n",
+      " 59%|█████▉    | 15720448/26421880 [00:01<00:00, 14933524.60it/s]\n",
+      " 50%|████▉     | 13135872/26421880 [00:01<00:00, 14499791.65it/s]\n",
+      " 65%|██████▌   | 17266688/26421880 [00:01<00:00, 15051136.83it/s]\n",
+      " 56%|█████▌    | 14682112/26421880 [00:01<00:00, 14772346.00it/s]\n",
+      " 71%|███████   | 18813952/26421880 [00:01<00:00, 15130807.12it/s]\n",
+      " 61%|██████▏   | 16228352/26421880 [00:01<00:00, 14967937.04it/s]\n",
+      " 77%|███████▋  | 20360192/26421880 [00:01<00:00, 15195261.31it/s]\n",
+      " 67%|██████▋   | 17775616/26421880 [00:01<00:00, 15112781.93it/s]\n",
+      " 83%|████████▎ | 21906432/26421880 [00:01<00:00, 15236573.97it/s]\n",
+      " 73%|███████▎  | 19321856/26421880 [00:01<00:00, 15212408.07it/s]\n",
+      " 89%|████████▉ | 23453696/26421880 [00:02<00:00, 15266838.91it/s]\n",
+      " 79%|███████▉  | 20868096/26421880 [00:01<00:00, 15269608.06it/s]\n",
+      " 95%|█████████▍| 24999936/26421880 [00:02<00:00, 15289978.61it/s]\n",
+      " 91%|█████████ | 23961600/26421880 [00:02<00:00, 15340254.66it/s]\n",
+      "26422272it [00:02, 11870579.44it/s]                              \n",
+      " 97%|█████████▋| 25507840/26421880 [00:02<00:00, 15364219.70it/s]\n",
+      "26422272it [00:02, 11859017.59it/s]                              \n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m \n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m \n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "  0%|          | 0/29515 [00:00<?, ?it/s]m \n",
+      "  0%|          | 0/29515 [00:00<?, ?it/s]m \n",
+      "29696it [00:00, 295064.38it/s]                           \n",
+      "29696it [00:00, 296748.03it/s]           m \n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Result for TorchTrainer_a9dda_00000:\n",
-      "  _time_this_iter_s: 10.072710990905762\n",
-      "  _timestamp: 1655204645\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m \n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m \n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "  0%|          | 0/4422102 [00:00<?, ?it/s]\n",
+      "  0%|          | 0/4422102 [00:00<?, ?it/s]\n",
+      "  1%|          | 34816/4422102 [00:00<00:12, 348148.71it/s]\n",
+      "  1%|          | 22528/4422102 [00:00<00:19, 225237.25it/s]\n",
+      "  2%|▏         | 69632/4422102 [00:00<00:12, 346462.21it/s]\n",
+      "  1%|          | 45056/4422102 [00:00<00:19, 224942.66it/s]\n",
+      "  2%|▏         | 104448/4422102 [00:00<00:12, 347157.14it/s]\n",
+      "  2%|▏         | 99328/4422102 [00:00<00:11, 368964.83it/s]\n",
+      "  4%|▍         | 184320/4422102 [00:00<00:08, 524405.18it/s]\n",
+      "  4%|▍         | 189440/4422102 [00:00<00:07, 577214.69it/s]\n",
+      "  9%|▊         | 384000/4422102 [00:00<00:03, 1052895.14it/s]\n",
+      "  9%|▉         | 396288/4422102 [00:00<00:03, 1111874.46it/s]\n",
+      " 18%|█▊        | 779264/4422102 [00:00<00:01, 2033939.42it/s]\n",
+      " 18%|█▊        | 806912/4422102 [00:00<00:01, 2121674.81it/s]\n",
+      " 36%|███▌      | 1573888/4422102 [00:00<00:00, 3955289.29it/s]\n",
+      " 37%|███▋      | 1630208/4422102 [00:00<00:00, 4106422.09it/s]\n",
+      "4422656it [00:00, 5316997.96it/s]                             \n",
+      "4422656it [00:00, 5349419.81it/s]                             \n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m \n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m \n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "6144it [00:00, 49085340.53it/s]         0m \n",
+      "6144it [00:00, 43975774.36it/s]         0m \n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m 2022-06-22 16:29:55,912\tINFO train_loop_utils.py:293 -- Moving model to device: cpu\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m 2022-06-22 16:29:55,913\tINFO train_loop_utils.py:331 -- Wrapping provided model in DDP.\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m 2022-06-22 16:29:55,899\tINFO train_loop_utils.py:293 -- Moving model to device: cpu\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m 2022-06-22 16:29:55,900\tINFO train_loop_utils.py:331 -- Wrapping provided model in DDP.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m \n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m \n",
+      "Result for TorchTrainer_86514_00000:\n",
+      "  _time_this_iter_s: 17.002915143966675\n",
+      "  _timestamp: 1655915407\n",
       "  _training_iteration: 1\n",
-      "  date: 2022-06-14_13-04-05\n",
+      "  date: 2022-06-22_16-30-07\n",
       "  done: false\n",
-      "  experiment_id: 1f001dea6bd948c39235e589f07fcd8f\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  experiment_id: 1e7954bef1c6432785374780fb0da29e\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 1\n",
-      "  loss: 2.1288197860596285\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7485\n",
+      "  loss: 2.1645877740945028\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481879\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 13.953598976135254\n",
-      "  time_this_iter_s: 13.953598976135254\n",
-      "  time_total_s: 13.953598976135254\n",
-      "  timestamp: 1655204645\n",
+      "  time_since_restore: 19.680341005325317\n",
+      "  time_this_iter_s: 19.680341005325317\n",
+      "  time_total_s: 19.680341005325317\n",
+      "  timestamp: 1655915407\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 1\n",
-      "  trial_id: a9dda_00000\n",
-      "  warmup_time: 0.0025289058685302734\n",
+      "  trial_id: '86514_00000'\n",
+      "  warmup_time: 0.004637956619262695\n",
       "  \n",
-      "Result for TorchTrainer_a9dda_00000:\n",
-      "  _time_this_iter_s: 9.129379987716675\n",
-      "  _timestamp: 1655204654\n",
+      "Result for TorchTrainer_86514_00000:\n",
+      "  _time_this_iter_s: 10.904694557189941\n",
+      "  _timestamp: 1655915418\n",
       "  _training_iteration: 2\n",
-      "  date: 2022-06-14_13-04-14\n",
+      "  date: 2022-06-22_16-30-18\n",
       "  done: false\n",
-      "  experiment_id: 1f001dea6bd948c39235e589f07fcd8f\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  experiment_id: 1e7954bef1c6432785374780fb0da29e\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 2\n",
-      "  loss: 1.8414961441307311\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7485\n",
+      "  loss: 1.905545388057733\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481879\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 23.07395100593567\n",
-      "  time_this_iter_s: 9.120352029800415\n",
-      "  time_total_s: 23.07395100593567\n",
-      "  timestamp: 1655204654\n",
+      "  time_since_restore: 30.562681436538696\n",
+      "  time_this_iter_s: 10.882340431213379\n",
+      "  time_total_s: 30.562681436538696\n",
+      "  timestamp: 1655915418\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 2\n",
-      "  trial_id: a9dda_00000\n",
-      "  warmup_time: 0.0025289058685302734\n",
+      "  trial_id: '86514_00000'\n",
+      "  warmup_time: 0.004637956619262695\n",
       "  \n",
-      "Result for TorchTrainer_a9dda_00000:\n",
-      "  _time_this_iter_s: 8.954904079437256\n",
-      "  _timestamp: 1655204663\n",
+      "Result for TorchTrainer_86514_00000:\n",
+      "  _time_this_iter_s: 11.091916799545288\n",
+      "  _timestamp: 1655915429\n",
       "  _training_iteration: 3\n",
-      "  date: 2022-06-14_13-04-23\n",
+      "  date: 2022-06-22_16-30-29\n",
       "  done: false\n",
-      "  experiment_id: 1f001dea6bd948c39235e589f07fcd8f\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  experiment_id: 1e7954bef1c6432785374780fb0da29e\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 3\n",
-      "  loss: 1.4759019393070487\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7485\n",
+      "  loss: 1.531144731363673\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481879\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 32.03323698043823\n",
-      "  time_this_iter_s: 8.959285974502563\n",
-      "  time_total_s: 32.03323698043823\n",
-      "  timestamp: 1655204663\n",
+      "  time_since_restore: 41.66515636444092\n",
+      "  time_this_iter_s: 11.102474927902222\n",
+      "  time_total_s: 41.66515636444092\n",
+      "  timestamp: 1655915429\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 3\n",
-      "  trial_id: a9dda_00000\n",
-      "  warmup_time: 0.0025289058685302734\n",
+      "  trial_id: '86514_00000'\n",
+      "  warmup_time: 0.004637956619262695\n",
       "  \n",
-      "Result for TorchTrainer_a9dda_00000:\n",
-      "  _time_this_iter_s: 9.941093921661377\n",
-      "  _timestamp: 1655204673\n",
+      "Result for TorchTrainer_86514_00000:\n",
+      "  _time_this_iter_s: 11.423810482025146\n",
+      "  _timestamp: 1655915440\n",
       "  _training_iteration: 4\n",
-      "  date: 2022-06-14_13-04-33\n",
+      "  date: 2022-06-22_16-30-40\n",
       "  done: false\n",
-      "  experiment_id: 1f001dea6bd948c39235e589f07fcd8f\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  experiment_id: 1e7954bef1c6432785374780fb0da29e\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 4\n",
-      "  loss: 1.2226136068629612\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7485\n",
+      "  loss: 1.2484390530616614\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481879\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 41.98633909225464\n",
-      "  time_this_iter_s: 9.953102111816406\n",
-      "  time_total_s: 41.98633909225464\n",
-      "  timestamp: 1655204673\n",
+      "  time_since_restore: 53.103771924972534\n",
+      "  time_this_iter_s: 11.438615560531616\n",
+      "  time_total_s: 53.103771924972534\n",
+      "  timestamp: 1655915440\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 4\n",
-      "  trial_id: a9dda_00000\n",
-      "  warmup_time: 0.0025289058685302734\n",
+      "  trial_id: '86514_00000'\n",
+      "  warmup_time: 0.004637956619262695\n",
       "  \n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7492)\u001b[0m Done!\n",
-      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=7491)\u001b[0m Done!\n",
-      "Result for TorchTrainer_a9dda_00000:\n",
-      "  _time_this_iter_s: 9.941093921661377\n",
-      "  _timestamp: 1655204673\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481912)\u001b[0m Done!\n",
+      "\u001b[2m\u001b[36m(BaseWorkerMixin pid=1481911)\u001b[0m Done!\n",
+      "Result for TorchTrainer_86514_00000:\n",
+      "  _time_this_iter_s: 11.423810482025146\n",
+      "  _timestamp: 1655915440\n",
       "  _training_iteration: 4\n",
-      "  date: 2022-06-14_13-04-33\n",
+      "  date: 2022-06-22_16-30-40\n",
       "  done: true\n",
-      "  experiment_id: 1f001dea6bd948c39235e589f07fcd8f\n",
+      "  experiment_id: 1e7954bef1c6432785374780fb0da29e\n",
       "  experiment_tag: '0'\n",
-      "  hostname: Kais-MacBook-Pro.fritz.box\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 4\n",
-      "  loss: 1.2226136068629612\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 7485\n",
+      "  loss: 1.2484390530616614\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1481879\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 41.98633909225464\n",
-      "  time_this_iter_s: 9.953102111816406\n",
-      "  time_total_s: 41.98633909225464\n",
-      "  timestamp: 1655204673\n",
+      "  time_since_restore: 53.103771924972534\n",
+      "  time_this_iter_s: 11.438615560531616\n",
+      "  time_total_s: 53.103771924972534\n",
+      "  timestamp: 1655915440\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 4\n",
-      "  trial_id: a9dda_00000\n",
-      "  warmup_time: 0.0025289058685302734\n",
+      "  trial_id: '86514_00000'\n",
+      "  warmup_time: 0.004637956619262695\n",
       "  \n"
      ]
     },
@@ -1206,7 +1454,7 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-06-14 13:04:34,537\tINFO tune.py:742 -- Total run time: 47.32 seconds (47.19 seconds for the tuning loop).\n"
+      "2022-06-22 16:30:41,236\tINFO tune.py:734 -- Total run time: 56.58 seconds (56.46 seconds for the tuning loop).\n"
      ]
     }
    ],
@@ -1237,8 +1485,8 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Last result: {'loss': 1.2226136068629612, '_timestamp': 1655204673, '_time_this_iter_s': 9.941093921661377, '_training_iteration': 4, 'time_this_iter_s': 9.953102111816406, 'should_checkpoint': True, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 4, 'trial_id': 'a9dda_00000', 'experiment_id': '1f001dea6bd948c39235e589f07fcd8f', 'date': '2022-06-14_13-04-33', 'timestamp': 1655204673, 'time_total_s': 41.98633909225464, 'pid': 7485, 'hostname': 'Kais-MacBook-Pro.fritz.box', 'node_ip': '127.0.0.1', 'config': {}, 'time_since_restore': 41.98633909225464, 'timesteps_since_restore': 0, 'iterations_since_restore': 4, 'warmup_time': 0.0025289058685302734, 'experiment_tag': '0'}\n",
-      "Checkpoint: <ray.air.checkpoint.Checkpoint object at 0x1bd3cdcd0>\n"
+      "Last result: {'loss': 1.2484390530616614, '_timestamp': 1655915440, '_time_this_iter_s': 11.423810482025146, '_training_iteration': 4, 'time_this_iter_s': 11.438615560531616, 'should_checkpoint': True, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 4, 'trial_id': '86514_00000', 'experiment_id': '1e7954bef1c6432785374780fb0da29e', 'date': '2022-06-22_16-30-40', 'timestamp': 1655915440, 'time_total_s': 53.103771924972534, 'pid': 1481879, 'hostname': 'ip-172-31-43-110', 'node_ip': '172.31.43.110', 'config': {}, 'time_since_restore': 53.103771924972534, 'timesteps_since_restore': 0, 'iterations_since_restore': 4, 'warmup_time': 0.004637956619262695, 'experiment_tag': '0'}\n",
+      "Checkpoint: <ray.air.checkpoint.Checkpoint object at 0x7f15317fc160>\n"
      ]
     }
    ],
@@ -1393,7 +1641,19 @@
    "execution_count": 23,
    "id": "4d8b0f50",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "ename": "ImportError",
+     "evalue": "cannot import name 'BatchPredictor' from 'ray.air' (/home/ubuntu/ray/python/ray/air/__init__.py)",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[0;31mImportError\u001b[0m                               Traceback (most recent call last)",
+      "\u001b[1;32m/home/ubuntu/ray/doc/source/ray-air/examples/convert_existing_pytorch_code_to_ray_air.ipynb Cell 49'\u001b[0m in \u001b[0;36m<cell line: 1>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> <a href='vscode-notebook-cell://ssh-remote%2Bec2-18-118-29-213.us-east-2.compute.amazonaws.com/home/ubuntu/ray/doc/source/ray-air/examples/convert_existing_pytorch_code_to_ray_air.ipynb#ch0000048vscode-remote?line=0'>1</a>\u001b[0m \u001b[39mfrom\u001b[39;00m \u001b[39mray\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mair\u001b[39;00m \u001b[39mimport\u001b[39;00m BatchPredictor\n\u001b[1;32m      <a href='vscode-notebook-cell://ssh-remote%2Bec2-18-118-29-213.us-east-2.compute.amazonaws.com/home/ubuntu/ray/doc/source/ray-air/examples/convert_existing_pytorch_code_to_ray_air.ipynb#ch0000048vscode-remote?line=1'>2</a>\u001b[0m \u001b[39mfrom\u001b[39;00m \u001b[39mray\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mair\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mpredictors\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mintegrations\u001b[39;00m\u001b[39m.\u001b[39;00m\u001b[39mtorch\u001b[39;00m \u001b[39mimport\u001b[39;00m TorchPredictor\n\u001b[1;32m      <a href='vscode-notebook-cell://ssh-remote%2Bec2-18-118-29-213.us-east-2.compute.amazonaws.com/home/ubuntu/ray/doc/source/ray-air/examples/convert_existing_pytorch_code_to_ray_air.ipynb#ch0000048vscode-remote?line=3'>4</a>\u001b[0m batch_predictor \u001b[39m=\u001b[39m BatchPredictor\u001b[39m.\u001b[39mfrom_checkpoint(result\u001b[39m.\u001b[39mcheckpoint, TorchPredictor, model\u001b[39m=\u001b[39mNeuralNetwork())\n",
+      "\u001b[0;31mImportError\u001b[0m: cannot import name 'BatchPredictor' from 'ray.air' (/home/ubuntu/ray/python/ray/air/__init__.py)"
+     ]
+    }
+   ],
    "source": [
     "from ray.air import BatchPredictor\n",
     "from ray.air.predictors.integrations.torch import TorchPredictor\n",
@@ -1411,7 +1671,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 24,
+   "execution_count": null,
    "id": "8cb0556f",
    "metadata": {},
    "outputs": [],
@@ -1431,7 +1691,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 25,
+   "execution_count": null,
    "id": "8a823f7a",
    "metadata": {},
    "outputs": [
@@ -1452,12 +1712,12 @@
    "id": "41094a55",
    "metadata": {},
    "source": [
-    "`results` is another Ray Dataset. We can use `results.to_pandas()` to see our prediction results:"
+    "`results` is another Ray Dataset. We can use `results.show()` to see our prediction results:"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 26,
+   "execution_count": null,
    "id": "d3dce40d",
    "metadata": {},
    "outputs": [
@@ -1558,7 +1818,7 @@
     }
    ],
    "source": [
-    "results.to_pandas()"
+    "results.show()"
    ]
   },
   {
@@ -1571,7 +1831,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 27,
+   "execution_count": null,
    "id": "f17b5c10",
    "metadata": {},
    "outputs": [
@@ -1599,7 +1859,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 28,
+   "execution_count": null,
    "id": "207e13b9",
    "metadata": {},
    "outputs": [],
@@ -1618,7 +1878,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 29,
+   "execution_count": null,
    "id": "2b2decc6",
    "metadata": {},
    "outputs": [
@@ -1719,7 +1979,7 @@
     }
    ],
    "source": [
-    "merged.to_pandas()"
+    "merged.show()"
    ]
   },
   {
@@ -1744,7 +2004,7 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "Python 3.8.10 ('venv': venv)",
    "language": "python",
    "name": "python3"
   },
@@ -1758,7 +2018,12 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.7"
+   "version": "3.8.10"
+  },
+  "vscode": {
+   "interpreter": {
+    "hash": "3c0d54d489a08ae47a06eae2fd00ff032d6cddb527c382959b7b2575f6a8167f"
+   }
   }
  },
  "nbformat": 4,
diff --git a/doc/source/ray-air/examples/huggingface_text_classification.ipynb b/doc/source/ray-air/examples/huggingface_text_classification.ipynb
index e75ed1e95cdb..529e5f236a99 100644
--- a/doc/source/ray-air/examples/huggingface_text_classification.ipynb
+++ b/doc/source/ray-air/examples/huggingface_text_classification.ipynb
@@ -1384,8 +1384,7 @@
         ")\n",
         "data = ray.data.from_pandas(pd.DataFrame(sentences, columns=[\"sentence\"]))\n",
         "prediction = predictor.predict(data)\n",
-        "prediction = prediction.to_pandas()\n",
-        "prediction"
+        "prediction.show()"
       ]
     },
     {
diff --git a/doc/source/ray-air/examples/lightgbm_example.ipynb b/doc/source/ray-air/examples/lightgbm_example.ipynb
index c59ba7262f61..4083be1dfe80 100644
--- a/doc/source/ray-air/examples/lightgbm_example.ipynb
+++ b/doc/source/ray-air/examples/lightgbm_example.ipynb
@@ -37,17 +37,13 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 4,
    "id": "102ef1ac",
    "metadata": {},
    "outputs": [],
    "source": [
-    "import argparse\n",
-    "import math\n",
     "from typing import Tuple\n",
     "\n",
-    "import pandas as pd\n",
-    "\n",
     "import ray\n",
     "from ray.train.batch_predictor import BatchPredictor\n",
     "from ray.train.lightgbm import LightGBMPredictor\n",
@@ -56,9 +52,8 @@
     "from ray.train.lightgbm import LightGBMTrainer\n",
     "from ray.data.dataset import Dataset\n",
     "from ray.air.result import Result\n",
-    "from ray.data.preprocessors import StandardScaler\n",
-    "from sklearn.datasets import load_breast_cancer\n",
-    "from sklearn.model_selection import train_test_split"
+    "from ray.air.util.datasets import train_test_split\n",
+    "from ray.data.preprocessors import StandardScaler"
    ]
   },
   {
@@ -71,24 +66,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 13,
    "id": "f1f35cd7",
    "metadata": {},
    "outputs": [],
    "source": [
     "def prepare_data() -> Tuple[Dataset, Dataset, Dataset]:\n",
-    "    data_raw = load_breast_cancer()\n",
-    "    dataset_df = pd.DataFrame(data_raw[\"data\"], columns=data_raw[\"feature_names\"])\n",
-    "    dataset_df[\"target\"] = data_raw[\"target\"]\n",
-    "    # add a random categorical column\n",
-    "    num_samples = len(dataset_df)\n",
-    "    dataset_df[\"categorical_column\"] = pd.Series(\n",
-    "        ([\"A\", \"B\"] * math.ceil(num_samples / 2))[:num_samples]\n",
-    "    )\n",
-    "    train_df, test_df = train_test_split(dataset_df, test_size=0.3)\n",
-    "    train_dataset = ray.data.from_pandas(train_df)\n",
-    "    valid_dataset = ray.data.from_pandas(test_df)\n",
-    "    test_dataset = ray.data.from_pandas(test_df.drop(\"target\", axis=1))\n",
+    "    dataset = ray.data.read_csv(\"s3://air-example-data/breast_cancer_with_categorical.csv\")\n",
+    "    train_dataset, valid_dataset = train_test_split(dataset, test_size=0.3)\n",
+    "    test_dataset = valid_dataset.map_batches(lambda df: df.drop(\"target\", axis=1), batch_format=\"pandas\")\n",
     "    return train_dataset, valid_dataset, test_dataset"
    ]
   },
@@ -102,7 +88,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 14,
    "id": "fefcbc8a",
    "metadata": {},
    "outputs": [],
@@ -150,7 +136,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 15,
    "id": "3f1d0c19",
    "metadata": {},
    "outputs": [],
@@ -164,14 +150,13 @@
     "    predicted_labels = (\n",
     "        batch_predictor.predict(test_dataset)\n",
     "        .map_batches(lambda df: (df > 0.5).astype(int), batch_format=\"pandas\")\n",
-    "        .to_pandas(limit=float(\"inf\"))\n",
     "    )\n",
-    "    print(f\"PREDICTED LABELS\\n{predicted_labels}\")\n",
+    "    print(f\"PREDICTED LABELS\")\n",
+    "    predicted_labels.show()\n",
     "\n",
-    "    shap_values = batch_predictor.predict(test_dataset, pred_contrib=True).to_pandas(\n",
-    "        limit=float(\"inf\")\n",
-    "    )\n",
-    "    print(f\"SHAP VALUES\\n{shap_values}\")"
+    "    shap_values = batch_predictor.predict(test_dataset, pred_contrib=True)\n",
+    "    print(f\"SHAP VALUES\")\n",
+    "    shap_values.show()"
    ]
   },
   {
@@ -184,7 +169,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 16,
    "id": "8244ff3c",
    "metadata": {},
    "outputs": [
@@ -192,18 +177,19 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-19 11:18:27,652\tINFO services.py:1483 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8265\u001b[39m\u001b[22m\n"
+      "2022-06-22 17:26:41,346\tWARNING read_api.py:260 -- The number of blocks in this dataset (1) limits its parallelism to 1 concurrent tasks. This is much less than the number of available CPU slots in the cluster. Use `.repartition(n)` to increase the number of dataset blocks.\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 46.26it/s]\n"
      ]
     },
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-05-19 11:18:47 (running for 00:00:15.19)<br>Memory usage on this node: 10.2/16.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/4.86 GiB heap, 0.0/2.0 GiB objects<br>Result logdir: /Users/kai/ray_results/LightGBMTrainer_2022-05-19_11-18-30<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-06-22 17:26:56 (running for 00:00:14.07)<br>Memory usage on this node: 10.0/31.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/8 CPUs, 0/0 GPUs, 0.0/13.32 GiB heap, 0.0/6.66 GiB objects<br>Result logdir: /home/ubuntu/ray_results/LightGBMTrainer_2022-06-22_17-26-41<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name                 </th><th>status    </th><th>loc           </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">  train-binary_logloss</th><th style=\"text-align: right;\">  train-binary_error</th><th style=\"text-align: right;\">  valid-binary_logloss</th></tr>\n",
+       "<tr><th>Trial name                 </th><th>status    </th><th>loc                  </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">  train-binary_logloss</th><th style=\"text-align: right;\">  train-binary_error</th><th style=\"text-align: right;\">  valid-binary_logloss</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>LightGBMTrainer_07bf3_00000</td><td>TERMINATED</td><td>127.0.0.1:9219</td><td style=\"text-align: right;\">   100</td><td style=\"text-align: right;\">         10.4622</td><td style=\"text-align: right;\">           0.000197893</td><td style=\"text-align: right;\">                   0</td><td style=\"text-align: right;\">              0.289033</td></tr>\n",
+       "<tr><td>LightGBMTrainer_7b049_00000</td><td>TERMINATED</td><td>172.31.43.110:1491578</td><td style=\"text-align: right;\">   100</td><td style=\"text-align: right;\">         10.9726</td><td style=\"text-align: right;\">           0.000574522</td><td style=\"text-align: right;\">                   0</td><td style=\"text-align: right;\">              0.171898</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -219,96 +205,139 @@
      "output_type": "stream",
      "text": [
       "UserWarning: cpus_per_actor is set to less than 2. Distributed LightGBM needs at least 2 CPUs per actor to train efficiently. This may lead to a degradation of performance during training.\n",
-      "\u001b[2m\u001b[33m(raylet)\u001b[0m 2022-05-19 11:18:32,940\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=51840 --object-store-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=56443 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58688 --redis-password=5241590000000000 --startup-token=16 --runtime-env-hash=-2010331134\n",
-      "\u001b[2m\u001b[33m(raylet)\u001b[0m 2022-05-19 11:18:36,664\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=51840 --object-store-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=56443 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58688 --redis-password=5241590000000000 --startup-token=17 --runtime-env-hash=-2010331069\n",
-      "\u001b[2m\u001b[36m(GBDTTrainable pid=9219)\u001b[0m UserWarning: Dataset 'train' has 1 blocks, which is less than the `num_workers` 2. This dataset will be automatically repartitioned to 2 blocks.\n",
-      "\u001b[2m\u001b[36m(GBDTTrainable pid=9219)\u001b[0m UserWarning: Dataset 'valid' has 1 blocks, which is less than the `num_workers` 2. This dataset will be automatically repartitioned to 2 blocks.\n",
-      "\u001b[2m\u001b[36m(GBDTTrainable pid=9219)\u001b[0m UserWarning: cpus_per_actor is set to less than 2. Distributed LightGBM needs at least 2 CPUs per actor to train efficiently. This may lead to a degradation of performance during training.\n",
-      "\u001b[2m\u001b[33m(raylet)\u001b[0m 2022-05-19 11:18:38,980\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=51840 --object-store-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=56443 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58688 --redis-password=5241590000000000 --startup-token=18 --runtime-env-hash=-2010331069\n",
-      "\u001b[2m\u001b[33m(raylet)\u001b[0m 2022-05-19 11:18:38,997\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=51840 --object-store-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=56443 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58688 --redis-password=5241590000000000 --startup-token=19 --runtime-env-hash=-2010331069\n",
-      "\u001b[2m\u001b[33m(raylet)\u001b[0m 2022-05-19 11:18:39,091\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=51840 --object-store-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=56443 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58688 --redis-password=5241590000000000 --startup-token=21 --runtime-env-hash=-2010331134\n",
-      "\u001b[2m\u001b[33m(raylet)\u001b[0m 2022-05-19 11:18:39,095\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=51840 --object-store-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=56443 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58688 --redis-password=5241590000000000 --startup-token=20 --runtime-env-hash=-2010331134\n",
-      "\u001b[2m\u001b[33m(raylet)\u001b[0m 2022-05-19 11:18:39,107\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=51840 --object-store-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=56443 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58688 --redis-password=5241590000000000 --startup-token=23 --runtime-env-hash=-2010331134\n",
-      "\u001b[2m\u001b[33m(raylet)\u001b[0m 2022-05-19 11:18:39,107\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=51840 --object-store-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-18-25_114449_9132/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=56443 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58688 --redis-password=5241590000000000 --startup-token=22 --runtime-env-hash=-2010331134\n"
+      "\u001b[2m\u001b[36m(pid=1491578)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491578)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491578)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491578)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491578)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491578)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491578)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491578)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(LightGBMTrainer pid=1491578)\u001b[0m UserWarning: Dataset 'train' has 1 blocks, which is less than the `num_workers` 2. This dataset will be automatically repartitioned to 2 blocks.\n",
+      "\u001b[2m\u001b[36m(LightGBMTrainer pid=1491578)\u001b[0m UserWarning: Dataset 'valid' has 1 blocks, which is less than the `num_workers` 2. This dataset will be automatically repartitioned to 2 blocks.\n",
+      "\u001b[2m\u001b[36m(LightGBMTrainer pid=1491578)\u001b[0m UserWarning: cpus_per_actor is set to less than 2. Distributed LightGBM needs at least 2 CPUs per actor to train efficiently. This may lead to a degradation of performance during training.\n",
+      "\u001b[2m\u001b[36m(pid=1491651)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491651)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1491651)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491651)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491651)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491653)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491653)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491653)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491653)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491653)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491653)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491653)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491653)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1491652)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491652)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491652)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491652)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491652)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491652)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491652)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491652)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m 2022-06-22 17:26:50,509\tWARNING __init__.py:190 -- DeprecationWarning: `ray.worker.get_resource_ids` is a private attribute and access will be removed in a future Ray version.\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m 2022-06-22 17:26:50,658\tWARNING __init__.py:190 -- DeprecationWarning: `ray.worker.get_resource_ids` is a private attribute and access will be removed in a future Ray version.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m [LightGBM] [Info] Trying to bind port 59039...\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m [LightGBM] [Info] Binding port 59039 succeeded\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m [LightGBM] [Info] Listening...\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m [LightGBM] [Info] Trying to bind port 46955...\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m [LightGBM] [Info] Binding port 46955 succeeded\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m [LightGBM] [Info] Listening...\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m [LightGBM] [Warning] Connecting to rank 1 failed, waiting for 200 milliseconds\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m UserWarning: Overriding the parameters from Reference Dataset.\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m UserWarning: categorical_column in param dict is overridden.\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m UserWarning: Overriding the parameters from Reference Dataset.\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m UserWarning: categorical_column in param dict is overridden.\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m [LightGBM] [Info] Trying to bind port 52127...\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m [LightGBM] [Info] Binding port 52127 succeeded\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m [LightGBM] [Info] Listening...\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m [LightGBM] [Warning] Connecting to rank 1 failed, waiting for 200 milliseconds\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9243)\u001b[0m [LightGBM] [Info] Trying to bind port 52128...\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9243)\u001b[0m [LightGBM] [Info] Binding port 52128 succeeded\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9243)\u001b[0m [LightGBM] [Info] Listening...\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m [LightGBM] [Info] Connected to rank 1\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m [LightGBM] [Info] Local rank: 0, total number of machines: 2\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m [LightGBM] [Warning] num_threads is set=1, n_jobs=-1 will be ignored. Current value: num_threads=1\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9243)\u001b[0m [LightGBM] [Info] Connected to rank 0\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9243)\u001b[0m [LightGBM] [Info] Local rank: 1, total number of machines: 2\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9243)\u001b[0m [LightGBM] [Warning] num_threads is set=1, n_jobs=-1 will be ignored. Current value: num_threads=1\n"
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m [LightGBM] [Info] Connected to rank 0\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m [LightGBM] [Info] Local rank: 1, total number of machines: 2\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491653)\u001b[0m [LightGBM] [Warning] num_threads is set=1, n_jobs=-1 will be ignored. Current value: num_threads=1\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m [LightGBM] [Info] Connected to rank 1\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m [LightGBM] [Info] Local rank: 0, total number of machines: 2\n",
+      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=1491652)\u001b[0m [LightGBM] [Warning] num_threads is set=1, n_jobs=-1 will be ignored. Current value: num_threads=1\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9243)\u001b[0m UserWarning: Overriding the parameters from Reference Dataset.\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9243)\u001b[0m UserWarning: categorical_column in param dict is overridden.\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m UserWarning: Overriding the parameters from Reference Dataset.\n",
-      "\u001b[2m\u001b[36m(_RemoteRayLightGBMActor pid=9242)\u001b[0m UserWarning: categorical_column in param dict is overridden.\n"
+      "\u001b[2m\u001b[36m(_QueueActor pid=1491650)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1491650)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1491650)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1491650)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1491650)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1491650)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1491650)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1491650)\u001b[0m   from pandas import MultiIndex, Int64Index\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Result for LightGBMTrainer_07bf3_00000:\n",
-      "  date: 2022-05-19_11-18-44\n",
+      "Result for LightGBMTrainer_7b049_00000:\n",
+      "  date: 2022-06-22_17-26-53\n",
       "  done: false\n",
-      "  experiment_id: 1d3640d1c3a743aeae7274a0ce253107\n",
-      "  hostname: Kais-MacBook-Pro.local\n",
+      "  experiment_id: b4a87c26a7604a43baf895755d4f16b3\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 1\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 9219\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1491578\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 8.41084909439087\n",
-      "  time_this_iter_s: 8.41084909439087\n",
-      "  time_total_s: 8.41084909439087\n",
-      "  timestamp: 1652955524\n",
+      "  time_since_restore: 8.369545459747314\n",
+      "  time_this_iter_s: 8.369545459747314\n",
+      "  time_total_s: 8.369545459747314\n",
+      "  timestamp: 1655918813\n",
       "  timesteps_since_restore: 0\n",
-      "  train-binary_error: 0.36683417085427134\n",
-      "  train-binary_logloss: 0.5804693664919086\n",
+      "  train-binary_error: 0.5175879396984925\n",
+      "  train-binary_logloss: 0.6302848981539763\n",
       "  training_iteration: 1\n",
-      "  trial_id: 07bf3_00000\n",
-      "  valid-binary_error: 0.36470588235294116\n",
-      "  valid-binary_logloss: 0.5868466345817073\n",
-      "  warmup_time: 0.004106044769287109\n",
+      "  trial_id: 7b049_00000\n",
+      "  valid-binary_error: 0.2\n",
+      "  valid-binary_logloss: 0.558752017793943\n",
+      "  warmup_time: 0.008721590042114258\n",
       "  \n",
-      "Result for LightGBMTrainer_07bf3_00000:\n",
-      "  date: 2022-05-19_11-18-46\n",
+      "Result for LightGBMTrainer_7b049_00000:\n",
+      "  date: 2022-06-22_17-26-56\n",
       "  done: true\n",
-      "  experiment_id: 1d3640d1c3a743aeae7274a0ce253107\n",
+      "  experiment_id: b4a87c26a7604a43baf895755d4f16b3\n",
       "  experiment_tag: '0'\n",
-      "  hostname: Kais-MacBook-Pro.local\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 100\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 9219\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1491578\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 10.46218204498291\n",
-      "  time_this_iter_s: 0.025421857833862305\n",
-      "  time_total_s: 10.46218204498291\n",
-      "  timestamp: 1652955526\n",
+      "  time_since_restore: 10.972588300704956\n",
+      "  time_this_iter_s: 0.027977466583251953\n",
+      "  time_total_s: 10.972588300704956\n",
+      "  timestamp: 1655918816\n",
       "  timesteps_since_restore: 0\n",
       "  train-binary_error: 0.0\n",
-      "  train-binary_logloss: 0.00019789273681613937\n",
+      "  train-binary_logloss: 0.0005745220956391456\n",
       "  training_iteration: 100\n",
-      "  trial_id: 07bf3_00000\n",
+      "  trial_id: 7b049_00000\n",
       "  valid-binary_error: 0.058823529411764705\n",
-      "  valid-binary_logloss: 0.2890328865004496\n",
-      "  warmup_time: 0.004106044769287109\n",
+      "  valid-binary_logloss: 0.17189847605331432\n",
+      "  warmup_time: 0.008721590042114258\n",
       "  \n"
      ]
     },
@@ -316,14 +345,14 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-19 11:18:47,218\tINFO tune.py:753 -- Total run time: 16.87 seconds (15.17 seconds for the tuning loop).\n"
+      "2022-06-22 17:26:56,406\tINFO tune.py:734 -- Total run time: 14.73 seconds (14.06 seconds for the tuning loop).\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "{'train-binary_logloss': 0.00019789273681613937, 'train-binary_error': 0.0, 'valid-binary_logloss': 0.2890328865004496, 'valid-binary_error': 0.058823529411764705, 'time_this_iter_s': 0.025421857833862305, 'should_checkpoint': True, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 100, 'trial_id': '07bf3_00000', 'experiment_id': '1d3640d1c3a743aeae7274a0ce253107', 'date': '2022-05-19_11-18-46', 'timestamp': 1652955526, 'time_total_s': 10.46218204498291, 'pid': 9219, 'hostname': 'Kais-MacBook-Pro.local', 'node_ip': '127.0.0.1', 'config': {}, 'time_since_restore': 10.46218204498291, 'timesteps_since_restore': 0, 'iterations_since_restore': 100, 'warmup_time': 0.004106044769287109, 'experiment_tag': '0'}\n"
+      "{'train-binary_logloss': 0.0005745220956391456, 'train-binary_error': 0.0, 'valid-binary_logloss': 0.17189847605331432, 'valid-binary_error': 0.058823529411764705, 'time_this_iter_s': 0.027977466583251953, 'should_checkpoint': True, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 100, 'trial_id': '7b049_00000', 'experiment_id': 'b4a87c26a7604a43baf895755d4f16b3', 'date': '2022-06-22_17-26-56', 'timestamp': 1655918816, 'time_total_s': 10.972588300704956, 'pid': 1491578, 'hostname': 'ip-172-31-43-110', 'node_ip': '172.31.43.110', 'config': {}, 'time_since_restore': 10.972588300704956, 'timesteps_since_restore': 0, 'iterations_since_restore': 100, 'warmup_time': 0.008721590042114258, 'experiment_tag': '0'}\n"
      ]
     }
    ],
@@ -341,7 +370,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 17,
    "id": "871c9be6",
    "metadata": {},
    "outputs": [
@@ -349,8 +378,18 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "Map Progress (1 actors 1 pending): 100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1/1 [00:02<00:00,  2.21s/it]\n",
-      "Map_Batches: 100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1/1 [00:00<00:00, 93.04it/s]\n"
+      "2022-06-22 17:26:57,517\tWARNING read_api.py:260 -- The number of blocks in this dataset (1) limits its parallelism to 1 concurrent tasks. This is much less than the number of available CPU slots in the cluster. Use `.repartition(n)` to increase the number of dataset blocks.\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 50.96it/s]\n",
+      "Map_Batches:   0%|          | 0/1 [00:00<?, ?it/s]\u001b[2m\u001b[36m(pid=1491998)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491998)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491998)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491998)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491998)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491998)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1491998)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1491998)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.05s/it]\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 75.07it/s]\n"
      ]
     },
     {
@@ -358,27 +397,49 @@
      "output_type": "stream",
      "text": [
       "PREDICTED LABELS\n",
-      "     predictions\n",
-      "0              1\n",
-      "1              1\n",
-      "2              1\n",
-      "3              1\n",
-      "4              1\n",
-      "..           ...\n",
-      "166            1\n",
-      "167            0\n",
-      "168            1\n",
-      "169            1\n",
-      "170            1\n",
-      "\n",
-      "[171 rows x 1 columns]\n"
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "Map Progress (1 actors 1 pending): 100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1/1 [00:02<00:00,  2.20s/it]"
+      "Map_Batches:   0%|          | 0/1 [00:00<?, ?it/s]\u001b[2m\u001b[36m(pid=1492031)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492031)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492031)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492031)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492031)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492031)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492031)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492031)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1492033)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492033)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492033)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492033)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492033)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492033)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492033)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492033)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:02<00:00,  2.09s/it]\n"
      ]
     },
     {
@@ -386,79 +447,40 @@
      "output_type": "stream",
      "text": [
       "SHAP VALUES\n",
-      "     predictions_0  predictions_1  predictions_2  predictions_3  \\\n",
-      "0         0.089310      -0.909119       0.042819       0.002084   \n",
-      "1         0.080590      -0.961430       0.043946      -0.014364   \n",
-      "2         0.080606      -0.778903       0.067703       0.005561   \n",
-      "3         0.095129      -0.281614       0.083395       0.005946   \n",
-      "4         0.085822       0.470362       0.106340      -0.014601   \n",
-      "..             ...            ...            ...            ...   \n",
-      "166       0.095845       0.217879       0.131259       0.045455   \n",
-      "167      -0.369657      -1.825973      -0.270361      -0.005203   \n",
-      "168       0.078703       0.142254       0.069414       0.002620   \n",
-      "169       0.069391       0.226548       0.035343      -0.014900   \n",
-      "170       0.088893       0.216221       0.068534      -0.015672   \n",
-      "\n",
-      "     predictions_4  predictions_5  predictions_6  predictions_7  \\\n",
-      "0        -0.243459       0.536332      -1.275628       0.490998   \n",
-      "1         0.888434      -0.666081       0.541587       1.229128   \n",
-      "2        -0.444282      -0.886527       0.615167       1.113725   \n",
-      "3         0.292466      -0.205161       0.606795       0.971005   \n",
-      "4         0.549158      -0.405526       0.601660       0.438182   \n",
-      "..             ...            ...            ...            ...   \n",
-      "166      -0.177095       0.418596       0.649067       0.853719   \n",
-      "167       0.248983       0.327855       0.028472      -0.396260   \n",
-      "168       0.398207       0.217577       0.655739       0.779261   \n",
-      "169      -0.395022      -1.123284       0.555980       0.367841   \n",
-      "170       0.478937       0.223053      -1.091246       0.506502   \n",
-      "\n",
-      "     predictions_8  predictions_9  ...  predictions_22  predictions_23  \\\n",
-      "0         0.245076       0.145549  ...        0.635400        1.961269   \n",
-      "1        -0.344460       0.013988  ...        0.676673        1.151546   \n",
-      "2         0.179933       0.109160  ...        0.689301        1.877165   \n",
-      "3         0.172837       0.195020  ...        0.718073        1.592259   \n",
-      "4         0.182619      -0.127179  ...        0.682158        1.121333   \n",
-      "..             ...            ...  ...             ...             ...   \n",
-      "166       0.243637       0.070938  ...        0.744151        1.771634   \n",
-      "167       0.124145      -0.493628  ...       -0.541835       -2.201714   \n",
-      "168       0.179598       0.192144  ...        0.754423        1.300675   \n",
-      "169      -0.270785       0.072316  ...        0.531150        0.803271   \n",
-      "170       0.098758       0.163663  ...        0.545371        1.010722   \n",
-      "\n",
-      "     predictions_24  predictions_25  predictions_26  predictions_27  \\\n",
-      "0          0.251278        0.089320       -0.598509        1.552746   \n",
-      "1          0.284339        0.053013        0.818982        1.595459   \n",
-      "2          0.564781       -0.043412        0.613467        1.649626   \n",
-      "3          0.532693        0.070353        0.544844        1.746157   \n",
-      "4          0.311470        0.115707        1.179717        1.670017   \n",
-      "..              ...             ...             ...             ...   \n",
-      "166       -0.375872        0.127995        0.817884        1.686068   \n",
-      "167        0.625508        0.039757       -0.539761        0.908562   \n",
-      "168        0.398768        0.118736        0.736576        1.693371   \n",
-      "169        0.266529       -0.005190        0.850678        1.707049   \n",
-      "170        0.877337        0.080191       -0.588513        1.725231   \n",
-      "\n",
-      "     predictions_28  predictions_29  predictions_30  predictions_31  \n",
-      "0         -0.025840        0.106845       -0.037509        0.636929  \n",
-      "1          0.035559       -0.119623       -0.016733        0.636929  \n",
-      "2          0.043654        0.070261       -0.012863        0.636929  \n",
-      "3          0.082365        0.098007        0.024749        0.636929  \n",
-      "4          0.079768       -0.008935        0.035418        0.636929  \n",
-      "..              ...             ...             ...             ...  \n",
-      "166        0.043644       -0.044403       -0.038294        0.636929  \n",
-      "167        0.005756       -0.192442       -0.012280        0.636929  \n",
-      "168        0.054687        0.095692       -0.012863        0.636929  \n",
-      "169        0.086557       -0.104739       -0.016732        0.636929  \n",
-      "170       -0.319243        0.137260        0.023966        0.636929  \n",
-      "\n",
-      "[171 rows x 32 columns]\n"
+      "{'predictions_0': 0.006121974664714535, 'predictions_1': 0.8940294162424869, 'predictions_2': -0.013623909529011522, 'predictions_3': -0.26580572803883, 'predictions_4': 0.2897686828261492, 'predictions_5': -0.03784232120648852, 'predictions_6': 0.021865334852359534, 'predictions_7': 1.1753326094382734, 'predictions_8': -0.02525466292349231, 'predictions_9': 0.0733463992354119, 'predictions_10': 0.09191922035401615, 'predictions_11': -0.0035196096494634313, 'predictions_12': 0.20211476104388482, 'predictions_13': 0.7813488658944929, 'predictions_14': 0.10000464816891827, 'predictions_15': 0.11543593649642907, 'predictions_16': -0.009732477634862284, 'predictions_17': 0.19117650484758314, 'predictions_18': -0.17600075102817322, 'predictions_19': 0.5829434737180024, 'predictions_20': 1.4220773445509465, 'predictions_21': 0.6086211783805069, 'predictions_22': 2.0031654232526925, 'predictions_23': 0.3090376110779834, 'predictions_24': -0.21156467772251453, 'predictions_25': 0.14122943819731193, 'predictions_26': -0.1324700025487787, 'predictions_27': 0.8280650504246968, 'predictions_28': 0.03147457104755769, 'predictions_29': 0.00029604737237433516, 'predictions_30': 0.024336487839325866, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.00565090216762466, 'predictions_1': 0.7173247917145018, 'predictions_2': -0.01352989648419376, 'predictions_3': -0.204508963539279, 'predictions_4': -0.11703564338083555, 'predictions_5': 0.059858710083059874, 'predictions_6': 0.06974454296095976, 'predictions_7': 1.5952991804773315, 'predictions_8': 0.30494490847895245, 'predictions_9': 0.03770331660034111, 'predictions_10': 0.08779844216179675, 'predictions_11': 0.0001818669974550241, 'predictions_12': -0.10871732001356472, 'predictions_13': 0.49872871949407244, 'predictions_14': 0.16083030838859202, 'predictions_15': 0.4071487385487001, 'predictions_16': -0.00920287075428388, 'predictions_17': 0.21519060265555054, 'predictions_18': -0.24141319659570365, 'predictions_19': -0.19394859165532527, 'predictions_20': 1.2358452648954865, 'predictions_21': 0.16127531717942642, 'predictions_22': 1.3397755121893355, 'predictions_23': 0.24271016133964965, 'predictions_24': -0.11296858156987878, 'predictions_25': 0.21775788278030012, 'predictions_26': 0.8594002204044787, 'predictions_27': 1.0571631081079365, 'predictions_28': 0.06338809094380635, 'predictions_29': 0.14952090064808415, 'predictions_30': -0.020191656254497082, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.0011410972769028797, 'predictions_1': -0.023112580054428615, 'predictions_2': 0.0015007474035067395, 'predictions_3': -0.3960490192373774, 'predictions_4': -0.30646108596137317, 'predictions_5': -0.015606280874156383, 'predictions_6': -0.10875176916234583, 'predictions_7': -2.3253286264519457, 'predictions_8': 0.2758843675860649, 'predictions_9': 0.029091310311824298, 'predictions_10': -0.057950348636255644, 'predictions_11': -0.00017555498393944432, 'predictions_12': -0.4136454204716676, 'predictions_13': -0.3629735922139978, 'predictions_14': 0.04232756741319012, 'predictions_15': 0.06936920198392876, 'predictions_16': 0.010307144611165166, 'predictions_17': -0.4063116213440989, 'predictions_18': -0.07826460708005233, 'predictions_19': 0.28668914680505037, 'predictions_20': -2.0034181076720015, 'predictions_21': -0.4289092806234529, 'predictions_22': -2.059807308089095, 'predictions_23': -0.2625534917898286, 'predictions_24': -1.0607560950436483, 'predictions_25': -0.13241418825219023, 'predictions_26': -0.46713657128877134, 'predictions_27': -2.0707325110237127, 'predictions_28': -0.0212343580603297, 'predictions_29': -0.11761200100287779, 'predictions_30': 0.03805635018946682, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.003501920356918757, 'predictions_1': 0.9649889446638613, 'predictions_2': -0.011627077584939034, 'predictions_3': -0.33201537640627937, 'predictions_4': 0.2626117060870051, 'predictions_5': -0.0420997182498785, 'predictions_6': 0.05656763216450521, 'predictions_7': 1.076092179662977, 'predictions_8': -0.1396182169782879, 'predictions_9': -0.09872952353947571, 'predictions_10': 0.04378766056466948, 'predictions_11': 0.002478996394296549, 'predictions_12': 0.25042183813566526, 'predictions_13': 0.8751692867530225, 'predictions_14': 0.18679133739736484, 'predictions_15': 0.046846715006450504, 'predictions_16': -0.009211815518670832, 'predictions_17': 0.22485983912144494, 'predictions_18': -0.2861737431801593, 'predictions_19': -0.2533929278067911, 'predictions_20': 1.316951719635302, 'predictions_21': 1.1964971086769494, 'predictions_22': 1.2740098717427248, 'predictions_23': 0.25042580055967084, 'predictions_24': -0.4015257176668039, 'predictions_25': 0.17935395324361414, 'predictions_26': 1.126933988937795, 'predictions_27': 0.8031626612897146, 'predictions_28': 0.0771850514731471, 'predictions_29': 0.03755423306624511, 'predictions_30': -0.016833253240925238, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': -0.0034560551402153003, 'predictions_1': 0.5230708630376469, 'predictions_2': -0.015562114219360572, 'predictions_3': -0.1196402194436373, 'predictions_4': 0.4106482044292619, 'predictions_5': 0.06220233147046589, 'predictions_6': 0.12716114707514065, 'predictions_7': 1.3356455912614509, 'predictions_8': 0.1447514882444872, 'predictions_9': 0.12370386736447751, 'predictions_10': 0.07410456355721864, 'predictions_11': 0.012016763274156357, 'predictions_12': -0.10513441936331262, 'predictions_13': 0.7484191363603289, 'predictions_14': 0.18707788149117566, 'predictions_15': 0.3327881147491029, 'predictions_16': -0.009219336794413353, 'predictions_17': -0.10065740008750416, 'predictions_18': 0.16625881614886867, 'predictions_19': 0.23084551369873454, 'predictions_20': 1.358717098613538, 'predictions_21': 0.19175435277095332, 'predictions_22': 1.3375643842995248, 'predictions_23': 0.2926283902278477, 'predictions_24': 0.1146310032943002, 'predictions_25': 0.23343399483643015, 'predictions_26': 0.6034462734909513, 'predictions_27': 0.9230214841058666, 'predictions_28': 0.029594344165258104, 'predictions_29': 0.04913153000099999, 'predictions_30': 0.02341707352913655, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': -0.005102561841927789, 'predictions_1': 1.0861119112102469, 'predictions_2': -0.0154828846564582, 'predictions_3': -0.3088905099091714, 'predictions_4': 0.05779026036152443, 'predictions_5': 0.047351932324116885, 'predictions_6': 0.0876371219806605, 'predictions_7': 1.1210466016114495, 'predictions_8': -0.1252369777517682, 'predictions_9': 0.04572512843104436, 'predictions_10': 0.09245771221086214, 'predictions_11': 0.007753500238910626, 'predictions_12': 0.2309698163766563, 'predictions_13': 0.9684988783771291, 'predictions_14': 0.024511467599608535, 'predictions_15': 0.18657179919131872, 'predictions_16': -0.009212652411079585, 'predictions_17': -0.13395842318946233, 'predictions_18': 0.152376407447391, 'predictions_19': -0.28554273302892486, 'predictions_20': 1.3994697511973517, 'predictions_21': 0.5784457048607689, 'predictions_22': 1.3325378201278, 'predictions_23': 0.30730022154186687, 'predictions_24': 0.017237427138293876, 'predictions_25': 0.19484371531419448, 'predictions_26': 1.0716212980249242, 'predictions_27': 0.7424857548065319, 'predictions_28': 0.030110335845485465, 'predictions_29': 0.08677604394991238, 'predictions_30': -0.018230914497616164, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.011026642414565658, 'predictions_1': 1.0433621693813095, 'predictions_2': -0.00702393810808943, 'predictions_3': -0.2962479861350653, 'predictions_4': 0.20838486132625483, 'predictions_5': -0.07568934141814487, 'predictions_6': 0.026798049998736986, 'predictions_7': 1.2233970557267948, 'predictions_8': -0.07215770822854156, 'predictions_9': 0.016138237086580777, 'predictions_10': 0.04908427317188252, 'predictions_11': -0.013274124641011575, 'predictions_12': -0.16059386568879297, 'predictions_13': 0.38386374312584454, 'predictions_14': -0.03476748264814593, 'predictions_15': -0.5225211720205649, 'predictions_16': -0.009220168600202043, 'predictions_17': -0.15278574495418593, 'predictions_18': 0.12911665421378546, 'predictions_19': -0.2782951415110554, 'predictions_20': 1.2470508123020512, 'predictions_21': 1.049830317708393, 'predictions_22': 2.102971796648596, 'predictions_23': 0.2851979247349288, 'predictions_24': -0.0006702647871052775, 'predictions_25': -0.11420596882801563, 'predictions_26': 1.0834575497816143, 'predictions_27': 0.8164104508549398, 'predictions_28': 0.06634783513626033, 'predictions_29': 0.10518170393387423, 'predictions_30': 0.05948635171854934, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.008846265655878418, 'predictions_1': 1.071493056050533, 'predictions_2': 0.0241002358002765, 'predictions_3': -0.2914009217752569, 'predictions_4': -0.1844514405858182, 'predictions_5': 0.09688586653158524, 'predictions_6': 0.1189004872794518, 'predictions_7': 0.019812317046639417, 'predictions_8': -0.0841879790447643, 'predictions_9': 0.0689671067023492, 'predictions_10': 0.057123796305462, 'predictions_11': 0.018751811843757425, 'predictions_12': -0.19278774516524225, 'predictions_13': 0.5521382975001031, 'predictions_14': -0.1961614983559944, 'predictions_15': 0.3352816348185536, 'predictions_16': -0.009197695434128215, 'predictions_17': -0.0600167757501572, 'predictions_18': 0.27488314466683056, 'predictions_19': -0.35962747336476697, 'predictions_20': 1.2317107478669351, 'predictions_21': 0.05530975604521487, 'predictions_22': 2.382011011440535, 'predictions_23': 0.33824065775317486, 'predictions_24': 0.3498540690011901, 'predictions_25': 0.1739274660593352, 'predictions_26': 1.160333734158511, 'predictions_27': 1.033879786485623, 'predictions_28': 0.08158573366246898, 'predictions_29': 0.10563970622307337, 'predictions_30': -0.04267793892712356, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.004750001129083867, 'predictions_1': 3.2244208404334374, 'predictions_2': 0.01622715285279811, 'predictions_3': -0.817260302999862, 'predictions_4': -0.09736090983332732, 'predictions_5': 0.07881792915896496, 'predictions_6': 0.24070898834769355, 'predictions_7': 0.05001221074373508, 'predictions_8': -0.2567854774979608, 'predictions_9': 0.03063087506346955, 'predictions_10': 0.05499599036837444, 'predictions_11': -0.015303644634305683, 'predictions_12': -0.14884606737286166, 'predictions_13': 0.8519672928318166, 'predictions_14': 0.09824149785766935, 'predictions_15': 0.26921023748269235, 'predictions_16': -0.010848751281971217, 'predictions_17': -0.11619083730523652, 'predictions_18': -0.17527472428145596, 'predictions_19': -0.5874677933384177, 'predictions_20': -0.3990904299729458, 'predictions_21': 2.2068328291797936, 'predictions_22': -1.932202847332452, 'predictions_23': -0.3152964245377162, 'predictions_24': 0.7834452171983805, 'predictions_25': 0.2512128072560273, 'predictions_26': -0.6206434154152907, 'predictions_27': 0.08708205787374604, 'predictions_28': 0.040648951231987765, 'predictions_29': 0.06879586583909683, 'predictions_30': 0.043515107484221424, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': -0.011027810657660349, 'predictions_1': -0.5337191669392997, 'predictions_2': -0.0026033241771052282, 'predictions_3': -0.2382336633486158, 'predictions_4': 0.8615636351404935, 'predictions_5': 0.059347121609268944, 'predictions_6': 0.14253423982272048, 'predictions_7': 1.4462830393121449, 'predictions_8': -0.06536550111076092, 'predictions_9': 0.12249420022849346, 'predictions_10': -0.040845467674169966, 'predictions_11': 0.03619973926410233, 'predictions_12': -0.14839345664605622, 'predictions_13': -0.38765958181699983, 'predictions_14': 0.45137385893985227, 'predictions_15': 0.4818261473751218, 'predictions_16': 0.005229328958126197, 'predictions_17': -0.14927291449462546, 'predictions_18': 0.12257473692108792, 'predictions_19': 0.5775523654869467, 'predictions_20': 1.4945158847763393, 'predictions_21': -0.11572127634540279, 'predictions_22': 1.2803791500605577, 'predictions_23': 0.2519454034779557, 'predictions_24': 0.12639705427540554, 'predictions_25': 0.20374090734634412, 'predictions_26': 0.9872077234715891, 'predictions_27': 1.1931782325388345, 'predictions_28': 0.07647609206107736, 'predictions_29': 0.017535160650109134, 'predictions_30': -0.011152247353355573, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': -0.009236814888869137, 'predictions_1': -0.08974532751806996, 'predictions_2': -0.005072446447076212, 'predictions_3': -0.49454476931590674, 'predictions_4': -0.14583165960960504, 'predictions_5': 0.037743362980294, 'predictions_6': -0.09071218034159645, 'predictions_7': -2.076157655204495, 'predictions_8': 0.6915530135596496, 'predictions_9': 0.015305309316520455, 'predictions_10': -0.05407297473599998, 'predictions_11': -0.01202689608724274, 'predictions_12': -0.37048240770136764, 'predictions_13': -1.1222567180136822, 'predictions_14': 0.037999849333804875, 'predictions_15': 0.05179781531623324, 'predictions_16': -0.009442169563784072, 'predictions_17': -0.3518926772423797, 'predictions_18': -0.18168464537700557, 'predictions_19': -0.246308669315598, 'predictions_20': -1.8215267653197431, 'predictions_21': -0.16464307910939846, 'predictions_22': -2.294068720859334, 'predictions_23': -0.3304406806357679, 'predictions_24': -0.8059935139116144, 'predictions_25': -0.15473187742974112, 'predictions_26': -0.44492987082868113, 'predictions_27': -1.706574981012038, 'predictions_28': 0.009928350750753007, 'predictions_29': -0.005531569126011125, 'predictions_30': 0.03400893184303606, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.002893918337539625, 'predictions_1': 0.6953965947651528, 'predictions_2': -0.013300368855470382, 'predictions_3': -0.15693491782098012, 'predictions_4': 0.4052561639196121, 'predictions_5': -0.01785344804083238, 'predictions_6': 0.19406598570732034, 'predictions_7': 1.5796202341560919, 'predictions_8': 0.28954821935673325, 'predictions_9': -0.215897797520852, 'predictions_10': 0.05835282036206641, 'predictions_11': 0.03331176153763488, 'predictions_12': -0.10112958834294049, 'predictions_13': 0.3947745629125056, 'predictions_14': 0.22909135741673778, 'predictions_15': 0.473005657256218, 'predictions_16': -0.009633689567643305, 'predictions_17': -0.09362381604913257, 'predictions_18': 0.14969971629912343, 'predictions_19': -0.1688864705396212, 'predictions_20': 1.3001215347067874, 'predictions_21': -0.21918668227485943, 'predictions_22': 1.3437058168797267, 'predictions_23': 0.3124907025891718, 'predictions_24': 0.14131080537131419, 'predictions_25': 0.2243700411172835, 'predictions_26': 0.9296630907535046, 'predictions_27': 0.41471504174869356, 'predictions_28': 0.020173572275052214, 'predictions_29': 0.04820465228613692, 'predictions_30': -0.020545384469295942, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.0019388150699810927, 'predictions_1': 0.9223705632364128, 'predictions_2': -0.012007685883043798, 'predictions_3': -0.31903137131372966, 'predictions_4': 0.628481905867853, 'predictions_5': -0.06149389221971728, 'predictions_6': 0.07061611794203079, 'predictions_7': 1.3823056189088423, 'predictions_8': -0.133343124664483, 'predictions_9': 0.11603949252367812, 'predictions_10': 0.21857476218484376, 'predictions_11': 0.015902798791774055, 'predictions_12': 0.2913666065699202, 'predictions_13': 0.9315294837553827, 'predictions_14': 0.277372510153019, 'predictions_15': -0.5071083100622337, 'predictions_16': -0.009631147961094873, 'predictions_17': 0.23976024706824375, 'predictions_18': -0.20540519019181294, 'predictions_19': -0.2450413530123813, 'predictions_20': 1.1789579806256083, 'predictions_21': -1.5177833757024324, 'predictions_22': 1.4604002248277352, 'predictions_23': 0.27531878725283415, 'predictions_24': -1.352094841156462, 'predictions_25': 0.16870219247146698, 'predictions_26': 1.2263320807717468, 'predictions_27': 0.8656450275023648, 'predictions_28': 0.04415827467622267, 'predictions_29': 0.049210669003044466, 'predictions_30': 0.03485239596130599, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.003483875604996794, 'predictions_1': 0.9677217395705439, 'predictions_2': -0.01375116195045965, 'predictions_3': -0.3148394441913672, 'predictions_4': -0.2574040676795255, 'predictions_5': 0.07782351238517007, 'predictions_6': 0.09223237164727777, 'predictions_7': 1.359163521325679, 'predictions_8': -0.10520478897286097, 'predictions_9': 0.051820926250002466, 'predictions_10': 0.15651454755052202, 'predictions_11': 0.012354841533717503, 'predictions_12': 0.29314938008831337, 'predictions_13': 1.0134451429783053, 'predictions_14': 0.07334166731849916, 'predictions_15': -0.5580245806930221, 'predictions_16': -0.009637538822743917, 'predictions_17': -0.12931888564696647, 'predictions_18': -0.08985648327837921, 'predictions_19': -0.2838831478457971, 'predictions_20': 1.197739882302604, 'predictions_21': -0.14264086768498266, 'predictions_22': 2.4168915798709034, 'predictions_23': 0.35060520926622657, 'predictions_24': -0.243435195670719, 'predictions_25': 0.15680747277488985, 'predictions_26': 1.2012113470638528, 'predictions_27': 0.9897751319349664, 'predictions_28': 0.05573907097988011, 'predictions_29': 0.06252860717834312, 'predictions_30': -0.05792966463337761, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.015122615065552805, 'predictions_1': -1.1167653489947622, 'predictions_2': -0.008012147012472742, 'predictions_3': -0.20874221256644707, 'predictions_4': 0.4252072619730782, 'predictions_5': 0.0038900875799020296, 'predictions_6': 0.1140119630004244, 'predictions_7': 1.1987104625838227, 'predictions_8': -0.0802347059616203, 'predictions_9': 0.14227487864929314, 'predictions_10': 0.061570146412656145, 'predictions_11': -0.0013235117361348366, 'predictions_12': 0.22496427871452854, 'predictions_13': 0.6826705611065566, 'predictions_14': 0.331084179340632, 'predictions_15': 0.2325873510907064, 'predictions_16': -0.005890948415758354, 'predictions_17': 0.23108082656181192, 'predictions_18': 0.08866538976848874, 'predictions_19': 0.5251741787977718, 'predictions_20': 1.5307505517513718, 'predictions_21': -0.07014338016238107, 'predictions_22': 1.8024293796373567, 'predictions_23': 0.3420427562962711, 'predictions_24': -0.3356060347979862, 'predictions_25': 0.08823113765567157, 'predictions_26': 0.9993112240252872, 'predictions_27': 1.1583364010362838, 'predictions_28': 0.05818942683648322, 'predictions_29': -0.010171113593323115, 'predictions_30': 0.017500344327137828, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.00510007523648401, 'predictions_1': -1.8438586845336085, 'predictions_2': 0.07034588660781765, 'predictions_3': -0.6334911581627888, 'predictions_4': 0.9114601232034509, 'predictions_5': 0.015641139153578926, 'predictions_6': 0.3391581513516312, 'predictions_7': 0.015993612058473987, 'predictions_8': 0.4979057135726034, 'predictions_9': 0.14140896753303245, 'predictions_10': 0.03348118561743431, 'predictions_11': 0.018019313387541973, 'predictions_12': -0.1851865976812716, 'predictions_13': 0.18463673035754868, 'predictions_14': 0.3321862529567762, 'predictions_15': 0.4582953091852766, 'predictions_16': -0.023872509230380146, 'predictions_17': -0.05714457269664822, 'predictions_18': 0.1677010761064405, 'predictions_19': 0.6590215547332258, 'predictions_20': -0.4470726570372422, 'predictions_21': -1.2957188152033094, 'predictions_22': -0.49568168502602117, 'predictions_23': -0.5319175224432703, 'predictions_24': 0.8792904089758667, 'predictions_25': -0.16764333932557407, 'predictions_26': -0.5006140094263773, 'predictions_27': -0.559662593948684, 'predictions_28': 0.009575432219475658, 'predictions_29': 0.03620587401831965, 'predictions_30': -0.022617768077518082, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': -0.0035275503865915213, 'predictions_1': -1.7572879984733045, 'predictions_2': 0.02112961345058588, 'predictions_3': -0.5373126141152578, 'predictions_4': 0.8167634172202621, 'predictions_5': -0.04568688093881375, 'predictions_6': 0.25612518616907237, 'predictions_7': 1.6585574657259259, 'predictions_8': 0.5708485569128593, 'predictions_9': -0.2579041111541445, 'predictions_10': -0.02303431468406031, 'predictions_11': 0.0294850340796527, 'predictions_12': -0.20150167754729115, 'predictions_13': -0.3122660955180186, 'predictions_14': 0.08946441512158586, 'predictions_15': 0.19599051996984723, 'predictions_16': -0.007048153187921441, 'predictions_17': -0.10443059840913398, 'predictions_18': 0.14693551914712497, 'predictions_19': -0.2646088763947528, 'predictions_20': -0.14423328554566225, 'predictions_21': -1.096484854939204, 'predictions_22': -0.5409155996124657, 'predictions_23': -0.2125528115678197, 'predictions_24': 0.2028301059851276, 'predictions_25': 0.15076353496237724, 'predictions_26': 1.863813974679114, 'predictions_27': 1.2625204294969739, 'predictions_28': -0.009542569876103744, 'predictions_29': 0.08892200769099384, 'predictions_30': 0.016344768954324324, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.009144654047150176, 'predictions_1': 0.3616068989438007, 'predictions_2': -0.009713127697925978, 'predictions_3': -0.25503380890174077, 'predictions_4': -0.08841376708924753, 'predictions_5': 0.12905387860630704, 'predictions_6': 0.09872550234229752, 'predictions_7': 1.5461380270279617, 'predictions_8': 0.5934142135359506, 'predictions_9': 0.04672843933802434, 'predictions_10': 0.017982350366210965, 'predictions_11': 0.011836524186964618, 'predictions_12': -0.09329132650766998, 'predictions_13': 0.9816979966957412, 'predictions_14': -0.26131805604494435, 'predictions_15': 0.2573728246698596, 'predictions_16': -0.009616853447343936, 'predictions_17': -0.11778440476199589, 'predictions_18': 0.19894108953925974, 'predictions_19': -0.28976560140618507, 'predictions_20': 1.145755494068452, 'predictions_21': 0.19170884942775918, 'predictions_22': 1.751619931359333, 'predictions_23': 0.31591084941785597, 'predictions_24': -0.9883146017669252, 'predictions_25': 0.3832169744602564, 'predictions_26': 1.3459027320296548, 'predictions_27': 1.0895032649194054, 'predictions_28': 0.054326669111151096, 'predictions_29': 0.11224841710144848, 'predictions_30': -0.01934243236389702, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.05414474380600745, 'predictions_1': -1.149372263278166, 'predictions_2': -0.0034542658503694534, 'predictions_3': -0.11226127026369175, 'predictions_4': -0.2765479593192703, 'predictions_5': 0.057605254673602974, 'predictions_6': 0.04807218948118946, 'predictions_7': 1.627632661158546, 'predictions_8': 0.23594239851080898, 'predictions_9': 0.08102266882022441, 'predictions_10': -0.035797597595999694, 'predictions_11': -0.006940512375528646, 'predictions_12': -0.10341465914545066, 'predictions_13': 0.27134162901025793, 'predictions_14': -0.4589675261254597, 'predictions_15': 0.16906923946657362, 'predictions_16': -0.005805030106413082, 'predictions_17': -0.11670739934889805, 'predictions_18': 0.270439579413901, 'predictions_19': 0.2757024597749045, 'predictions_20': 1.2679444783850085, 'predictions_21': -1.2185063190204835, 'predictions_22': 2.6862730600162457, 'predictions_23': 0.45079291995440945, 'predictions_24': -0.8576927701312551, 'predictions_25': 0.1825880636881889, 'predictions_26': 0.9481775337394789, 'predictions_27': 1.3019845783662138, 'predictions_28': 0.03309325718132554, 'predictions_29': 0.037279537345320794, 'predictions_30': 0.030849407280271066, 'predictions_31': 1.5201632854544105}\n",
+      "{'predictions_0': 0.026701912078513444, 'predictions_1': -0.016049183561005216, 'predictions_2': -0.026512557715316794, 'predictions_3': -0.33992007086017256, 'predictions_4': -0.3231034954783173, 'predictions_5': 0.020522588667874812, 'predictions_6': -0.09818245278711138, 'predictions_7': -1.9632581054922957, 'predictions_8': 0.2796715168175009, 'predictions_9': 0.025963248780199805, 'predictions_10': -0.13243884691329014, 'predictions_11': -0.007600341414574132, 'predictions_12': -0.3505614312588073, 'predictions_13': -0.8449241022454159, 'predictions_14': -0.0623541831245574, 'predictions_15': 0.11533014973600747, 'predictions_16': 0.008322220108907262, 'predictions_17': -0.02930862278171467, 'predictions_18': 0.02496960430979726, 'predictions_19': 0.3997160251519232, 'predictions_20': -2.0119476119311948, 'predictions_21': -0.3601922717542553, 'predictions_22': -2.240466883625807, 'predictions_23': -0.24430626245778664, 'predictions_24': -0.732571668183472, 'predictions_25': -0.14435610495492934, 'predictions_26': -0.4186367055351456, 'predictions_27': -1.7801593987201698, 'predictions_28': 0.014498054148804375, 'predictions_29': -0.10768829118597369, 'predictions_30': -0.02172472974992555, 'predictions_31': 1.5201632854544105}\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\n"
+      "\u001b[2m\u001b[36m(pid=1492090)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492090)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492090)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492090)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492090)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/dask/dataframe/backends.py:181: FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492090)\u001b[0m   _numeric_index_types = (pd.Int64Index, pd.Float64Index, pd.UInt64Index)\n",
+      "\u001b[2m\u001b[36m(pid=1492090)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1492090)\u001b[0m   from pandas import MultiIndex, Int64Index\n"
      ]
     }
    ],
@@ -474,7 +496,7 @@
    "notebook_metadata_filter": "-all"
   },
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "Python 3.8.10 ('venv': venv)",
    "language": "python",
    "name": "python3"
   },
@@ -488,7 +510,12 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.7"
+   "version": "3.8.10"
+  },
+  "vscode": {
+   "interpreter": {
+    "hash": "3c0d54d489a08ae47a06eae2fd00ff032d6cddb527c382959b7b2575f6a8167f"
+   }
   }
  },
  "nbformat": 4,
diff --git a/doc/source/ray-air/examples/sklearn_example.ipynb b/doc/source/ray-air/examples/sklearn_example.ipynb
index e085d01ab44e..833aa18534b0 100644
--- a/doc/source/ray-air/examples/sklearn_example.ipynb
+++ b/doc/source/ray-air/examples/sklearn_example.ipynb
@@ -19,7 +19,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": null,
    "id": "88f4bb39",
    "metadata": {
     "pycharm": {
@@ -41,16 +41,13 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 9,
    "id": "c02eb5cd",
    "metadata": {},
    "outputs": [],
    "source": [
-    "import argparse\n",
-    "import math\n",
     "from typing import Tuple\n",
     "\n",
-    "import pandas as pd\n",
     "\n",
     "import ray\n",
     "from ray.data.dataset import Dataset\n",
@@ -58,12 +55,10 @@
     "from ray.train.sklearn import SklearnPredictor\n",
     "from ray.data.preprocessors import Chain, OrdinalEncoder, StandardScaler\n",
     "from ray.air.result import Result\n",
+    "from ray.air.util.datasets import train_test_split\n",
     "from ray.train.sklearn import SklearnTrainer\n",
     "\n",
-    "\n",
-    "from sklearn.datasets import load_breast_cancer\n",
     "from sklearn.ensemble import RandomForestClassifier\n",
-    "from sklearn.model_selection import train_test_split\n",
     "\n",
     "try:\n",
     "    from cuml.ensemble import RandomForestClassifier as cuMLRandomForestClassifier\n",
@@ -81,24 +76,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 10,
    "id": "3631ed1e",
    "metadata": {},
    "outputs": [],
    "source": [
     "def prepare_data() -> Tuple[Dataset, Dataset, Dataset]:\n",
-    "    data_raw = load_breast_cancer()\n",
-    "    dataset_df = pd.DataFrame(data_raw[\"data\"], columns=data_raw[\"feature_names\"])\n",
-    "    dataset_df[\"target\"] = data_raw[\"target\"]\n",
-    "    # add a random categorical column\n",
-    "    num_samples = len(dataset_df)\n",
-    "    dataset_df[\"categorical_column\"] = pd.Series(\n",
-    "        ([\"A\", \"B\"] * math.ceil(num_samples / 2))[:num_samples]\n",
-    "    )\n",
-    "    train_df, test_df = train_test_split(dataset_df, test_size=0.3)\n",
-    "    train_dataset = ray.data.from_pandas(train_df)\n",
-    "    valid_dataset = ray.data.from_pandas(test_df)\n",
-    "    test_dataset = ray.data.from_pandas(test_df.drop(\"target\", axis=1))\n",
+    "    dataset = ray.data.read_csv(\"s3://air-example-data/breast_cancer_with_categorical.csv\")\n",
+    "    train_dataset, valid_dataset = train_test_split(dataset, test_size=0.3)\n",
+    "    test_dataset = valid_dataset.map_batches(lambda df: df.drop(\"target\", axis=1), batch_format=\"pandas\")\n",
     "    return train_dataset, valid_dataset, test_dataset"
    ]
   },
@@ -112,7 +98,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 11,
    "id": "0fd39e42",
    "metadata": {},
    "outputs": [],
@@ -162,7 +148,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 12,
    "id": "59eeadd8",
    "metadata": {},
    "outputs": [],
@@ -180,9 +166,9 @@
     "            num_gpus_per_worker=int(use_gpu),\n",
     "        )\n",
     "        .map_batches(lambda df: (df > 0.5).astype(int), batch_format=\"pandas\")\n",
-    "        .to_pandas(limit=float(\"inf\"))\n",
     "    )\n",
-    "    print(f\"PREDICTED LABELS\\n{predicted_labels}\")"
+    "    print(f\"PREDICTED LABELS\")\n",
+    "    predicted_labels.show()"
    ]
   },
   {
@@ -195,7 +181,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 13,
    "id": "43f9170a",
    "metadata": {},
    "outputs": [
@@ -203,18 +189,20 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-19 11:56:26,664\tINFO services.py:1483 -- View the Ray dashboard at \u001B[1m\u001B[32mhttp://127.0.0.1:8266\u001B[39m\u001B[22m\n"
+      "2022-06-22 17:27:37,741\tINFO services.py:1477 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8269\u001b[39m\u001b[22m\n",
+      "2022-06-22 17:27:39,822\tWARNING read_api.py:260 -- The number of blocks in this dataset (1) limits its parallelism to 1 concurrent tasks. This is much less than the number of available CPU slots in the cluster. Use `.repartition(n)` to increase the number of dataset blocks.\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 44.05it/s]\n"
      ]
     },
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-05-19 11:56:51 (running for 00:00:20.56)<br>Memory usage on this node: 10.1/16.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/4.64 GiB heap, 0.0/2.0 GiB objects<br>Result logdir: /Users/kai/ray_results/SklearnTrainer_2022-05-19_11-56-29<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-06-22 17:27:59 (running for 00:00:18.31)<br>Memory usage on this node: 10.7/31.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/8 CPUs, 0/0 GPUs, 0.0/12.9 GiB heap, 0.0/6.45 GiB objects<br>Result logdir: /home/ubuntu/ray_results/SklearnTrainer_2022-06-22_17-27-40<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name                </th><th>status    </th><th>loc            </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">  fit_time</th></tr>\n",
+       "<tr><th>Trial name                </th><th>status    </th><th>loc                  </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">  fit_time</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>SklearnTrainer_564d9_00000</td><td>TERMINATED</td><td>127.0.0.1:12221</td><td style=\"text-align: right;\">     1</td><td style=\"text-align: right;\">         17.1905</td><td style=\"text-align: right;\">   2.48662</td></tr>\n",
+       "<tr><td>SklearnTrainer_9dec8_00000</td><td>TERMINATED</td><td>172.31.43.110:1492629</td><td style=\"text-align: right;\">     1</td><td style=\"text-align: right;\">         15.6842</td><td style=\"text-align: right;\">   2.31571</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -229,127 +217,107 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:31,837\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=16 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:34,848\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=17 --runtime-env-hash=-2010331069\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m 2022-05-19 11:56:36,385\tWARNING pool.py:591 -- The 'context' argument is not supported using ray. Please refer to the documentation for how to control ray initialization.\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:37,344\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=19 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:37,344\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=18 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:39,843\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=21 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:39,845\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=20 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:42,324\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=23 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:42,324\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=22 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:44,748\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=24 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:44,749\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=25 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:47,193\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=27 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:47,193\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=26 --runtime-env-hash=-2010331134\n"
-     ]
-    },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:49,612\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=28 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:56:49,612\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=55845 --object-store-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-56-23_998044_12148/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=59341 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:58305 --redis-password=5241590000000000 --startup-token=29 --runtime-env-hash=-2010331134\n"
+      "\u001b[2m\u001b[36m(SklearnTrainer pid=1492629)\u001b[0m 2022-06-22 17:27:45,647\tWARNING pool.py:591 -- The 'context' argument is not supported using ray. Please refer to the documentation for how to control ray initialization.\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Result for SklearnTrainer_564d9_00000:\n",
+      "Result for SklearnTrainer_9dec8_00000:\n",
       "  cv:\n",
       "    fit_time:\n",
-      "    - 2.402121067047119\n",
-      "    - 2.312839984893799\n",
-      "    - 2.3265390396118164\n",
-      "    - 2.325679063796997\n",
-      "    - 2.3602960109710693\n",
-      "    fit_time_mean: 2.34549503326416\n",
-      "    fit_time_std: 0.032384969255539235\n",
+      "    - 2.221003770828247\n",
+      "    - 2.215489387512207\n",
+      "    - 2.2075674533843994\n",
+      "    - 2.222351312637329\n",
+      "    - 2.312389612197876\n",
+      "    fit_time_mean: 2.235760307312012\n",
+      "    fit_time_std: 0.03866614559685742\n",
       "    score_time:\n",
-      "    - 0.10820889472961426\n",
-      "    - 0.10829401016235352\n",
-      "    - 0.10703587532043457\n",
-      "    - 0.10512709617614746\n",
-      "    - 0.10840892791748047\n",
-      "    score_time_mean: 0.10741496086120605\n",
-      "    score_time_std: 0.0012465199424455708\n",
+      "    - 0.022464990615844727\n",
+      "    - 0.0230865478515625\n",
+      "    - 0.02564835548400879\n",
+      "    - 0.029137849807739258\n",
+      "    - 0.021221637725830078\n",
+      "    score_time_mean: 0.02431187629699707\n",
+      "    score_time_std: 0.0028120522003997595\n",
       "    test_score:\n",
       "    - 0.9625\n",
-      "    - 0.8875\n",
+      "    - 0.9125\n",
+      "    - 0.9875\n",
       "    - 1.0\n",
-      "    - 0.9493670886075949\n",
-      "    - 0.9240506329113924\n",
-      "    test_score_mean: 0.9446835443037976\n",
-      "    test_score_std: 0.03766947497186954\n",
-      "  date: 2022-05-19_11-56-51\n",
+      "    - 0.9367088607594937\n",
+      "    test_score_mean: 0.9598417721518986\n",
+      "    test_score_std: 0.032128186960552516\n",
+      "  date: 2022-06-22_17-27-59\n",
       "  done: false\n",
-      "  experiment_id: 200cbc1e2b84434882732d2053ec45c2\n",
-      "  fit_time: 2.4866180419921875\n",
-      "  hostname: Kais-MacBook-Pro.local\n",
+      "  experiment_id: f8215019c10e4a81ba2187c38e875365\n",
+      "  fit_time: 2.3157050609588623\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 1\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 12221\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1492629\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 17.19045615196228\n",
-      "  time_this_iter_s: 17.19045615196228\n",
-      "  time_total_s: 17.19045615196228\n",
-      "  timestamp: 1652957811\n",
+      "  time_since_restore: 15.684244871139526\n",
+      "  time_this_iter_s: 15.684244871139526\n",
+      "  time_total_s: 15.684244871139526\n",
+      "  timestamp: 1655918879\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 1\n",
-      "  trial_id: 564d9_00000\n",
+      "  trial_id: 9dec8_00000\n",
       "  valid:\n",
-      "    score_time: 0.10993409156799316\n",
-      "    test_score: 0.9473684210526315\n",
-      "  warmup_time: 0.0039539337158203125\n",
+      "    score_time: 0.03549623489379883\n",
+      "    test_score: 0.9532163742690059\n",
+      "  warmup_time: 0.0057866573333740234\n",
       "  \n",
-      "Result for SklearnTrainer_564d9_00000:\n",
+      "Result for SklearnTrainer_9dec8_00000:\n",
       "  cv:\n",
       "    fit_time:\n",
-      "    - 2.402121067047119\n",
-      "    - 2.312839984893799\n",
-      "    - 2.3265390396118164\n",
-      "    - 2.325679063796997\n",
-      "    - 2.3602960109710693\n",
-      "    fit_time_mean: 2.34549503326416\n",
-      "    fit_time_std: 0.032384969255539235\n",
+      "    - 2.221003770828247\n",
+      "    - 2.215489387512207\n",
+      "    - 2.2075674533843994\n",
+      "    - 2.222351312637329\n",
+      "    - 2.312389612197876\n",
+      "    fit_time_mean: 2.235760307312012\n",
+      "    fit_time_std: 0.03866614559685742\n",
       "    score_time:\n",
-      "    - 0.10820889472961426\n",
-      "    - 0.10829401016235352\n",
-      "    - 0.10703587532043457\n",
-      "    - 0.10512709617614746\n",
-      "    - 0.10840892791748047\n",
-      "    score_time_mean: 0.10741496086120605\n",
-      "    score_time_std: 0.0012465199424455708\n",
+      "    - 0.022464990615844727\n",
+      "    - 0.0230865478515625\n",
+      "    - 0.02564835548400879\n",
+      "    - 0.029137849807739258\n",
+      "    - 0.021221637725830078\n",
+      "    score_time_mean: 0.02431187629699707\n",
+      "    score_time_std: 0.0028120522003997595\n",
       "    test_score:\n",
       "    - 0.9625\n",
-      "    - 0.8875\n",
+      "    - 0.9125\n",
+      "    - 0.9875\n",
       "    - 1.0\n",
-      "    - 0.9493670886075949\n",
-      "    - 0.9240506329113924\n",
-      "    test_score_mean: 0.9446835443037976\n",
-      "    test_score_std: 0.03766947497186954\n",
-      "  date: 2022-05-19_11-56-51\n",
+      "    - 0.9367088607594937\n",
+      "    test_score_mean: 0.9598417721518986\n",
+      "    test_score_std: 0.032128186960552516\n",
+      "  date: 2022-06-22_17-27-59\n",
       "  done: true\n",
-      "  experiment_id: 200cbc1e2b84434882732d2053ec45c2\n",
+      "  experiment_id: f8215019c10e4a81ba2187c38e875365\n",
       "  experiment_tag: '0'\n",
-      "  fit_time: 2.4866180419921875\n",
-      "  hostname: Kais-MacBook-Pro.local\n",
+      "  fit_time: 2.3157050609588623\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 1\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 12221\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1492629\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 17.19045615196228\n",
-      "  time_this_iter_s: 17.19045615196228\n",
-      "  time_total_s: 17.19045615196228\n",
-      "  timestamp: 1652957811\n",
+      "  time_since_restore: 15.684244871139526\n",
+      "  time_this_iter_s: 15.684244871139526\n",
+      "  time_total_s: 15.684244871139526\n",
+      "  timestamp: 1655918879\n",
       "  timesteps_since_restore: 0\n",
       "  training_iteration: 1\n",
-      "  trial_id: 564d9_00000\n",
+      "  trial_id: 9dec8_00000\n",
       "  valid:\n",
-      "    score_time: 0.10993409156799316\n",
-      "    test_score: 0.9473684210526315\n",
-      "  warmup_time: 0.0039539337158203125\n",
+      "    score_time: 0.03549623489379883\n",
+      "    test_score: 0.9532163742690059\n",
+      "  warmup_time: 0.0057866573333740234\n",
       "  \n"
      ]
     },
@@ -357,28 +325,14 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/joblib/externals/loky/backend/resource_tracker.py:320: UserWarning: resource_tracker: There appear to be 6 leaked folder objects to clean up at shutdown\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m   (len(rtype_registry), rtype))\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/joblib/externals/loky/backend/resource_tracker.py:333: UserWarning: resource_tracker: /var/folders/b2/0_91bd757rz02lrmr920v0gw0000gn/T/joblib_memmapping_folder_12221_5f6216ae1e6a46ba9d419e794af5d6af_23c04cd6260143c0ac6f5dbe654ee805: FileNotFoundError(2, 'No such file or directory')\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m   warnings.warn('resource_tracker: %s: %r' % (name, e))\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/joblib/externals/loky/backend/resource_tracker.py:333: UserWarning: resource_tracker: /var/folders/b2/0_91bd757rz02lrmr920v0gw0000gn/T/joblib_memmapping_folder_12221_a9bc9a60f53a487e91b551aaace31955_1d562711c03e42ff9f97698134ab33f7: FileNotFoundError(2, 'No such file or directory')\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m   warnings.warn('resource_tracker: %s: %r' % (name, e))\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/joblib/externals/loky/backend/resource_tracker.py:333: UserWarning: resource_tracker: /var/folders/b2/0_91bd757rz02lrmr920v0gw0000gn/T/joblib_memmapping_folder_12221_4130f87b8a7a41d4bb44d3ff87c47d73_d3df48add59547d89737f42c03172fa5: FileNotFoundError(2, 'No such file or directory')\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m   warnings.warn('resource_tracker: %s: %r' % (name, e))\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/joblib/externals/loky/backend/resource_tracker.py:333: UserWarning: resource_tracker: /var/folders/b2/0_91bd757rz02lrmr920v0gw0000gn/T/joblib_memmapping_folder_12221_28d4366efda3422c93d8ad3a8d66986e_9d1ab8d6a92146829caf48550752190d: FileNotFoundError(2, 'No such file or directory')\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m   warnings.warn('resource_tracker: %s: %r' % (name, e))\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/joblib/externals/loky/backend/resource_tracker.py:333: UserWarning: resource_tracker: /var/folders/b2/0_91bd757rz02lrmr920v0gw0000gn/T/joblib_memmapping_folder_12221_4dc9b4c717294776b8162f30cc5eb4fe_068611691a404ca18d46ab1be089bc5a: FileNotFoundError(2, 'No such file or directory')\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m   warnings.warn('resource_tracker: %s: %r' % (name, e))\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m /Users/kai/.pyenv/versions/3.7.7/lib/python3.7/site-packages/joblib/externals/loky/backend/resource_tracker.py:333: UserWarning: resource_tracker: /var/folders/b2/0_91bd757rz02lrmr920v0gw0000gn/T/joblib_memmapping_folder_12221_0b60850fd8704b0e83f6c2758d9c1f2a_6ae1cfa0a68741b8b71f28a262bd7f7a: FileNotFoundError(2, 'No such file or directory')\n",
-      "\u001B[2m\u001B[36m(TrainTrainable pid=12221)\u001B[0m   warnings.warn('resource_tracker: %s: %r' % (name, e))\n",
-      "2022-05-19 11:56:51,305\tINFO tune.py:753 -- Total run time: 21.67 seconds (20.55 seconds for the tuning loop).\n"
+      "2022-06-22 17:27:59,333\tINFO tune.py:734 -- Total run time: 19.09 seconds (18.31 seconds for the tuning loop).\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "{'valid': {'score_time': 0.10993409156799316, 'test_score': 0.9473684210526315}, 'cv': {'fit_time': array([2.40212107, 2.31283998, 2.32653904, 2.32567906, 2.36029601]), 'score_time': array([0.10820889, 0.10829401, 0.10703588, 0.1051271 , 0.10840893]), 'test_score': array([0.9625    , 0.8875    , 1.        , 0.94936709, 0.92405063]), 'fit_time_mean': 2.34549503326416, 'fit_time_std': 0.032384969255539235, 'score_time_mean': 0.10741496086120605, 'score_time_std': 0.0012465199424455708, 'test_score_mean': 0.9446835443037976, 'test_score_std': 0.03766947497186954}, 'fit_time': 2.4866180419921875, 'time_this_iter_s': 17.19045615196228, 'should_checkpoint': True, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 1, 'trial_id': '564d9_00000', 'experiment_id': '200cbc1e2b84434882732d2053ec45c2', 'date': '2022-05-19_11-56-51', 'timestamp': 1652957811, 'time_total_s': 17.19045615196228, 'pid': 12221, 'hostname': 'Kais-MacBook-Pro.local', 'node_ip': '127.0.0.1', 'config': {}, 'time_since_restore': 17.19045615196228, 'timesteps_since_restore': 0, 'iterations_since_restore': 1, 'warmup_time': 0.0039539337158203125, 'experiment_tag': '0'}\n"
+      "{'valid': {'score_time': 0.03549623489379883, 'test_score': 0.9532163742690059}, 'cv': {'fit_time': array([2.22100377, 2.21548939, 2.20756745, 2.22235131, 2.31238961]), 'score_time': array([0.02246499, 0.02308655, 0.02564836, 0.02913785, 0.02122164]), 'test_score': array([0.9625    , 0.9125    , 0.9875    , 1.        , 0.93670886]), 'fit_time_mean': 2.235760307312012, 'fit_time_std': 0.03866614559685742, 'score_time_mean': 0.02431187629699707, 'score_time_std': 0.0028120522003997595, 'test_score_mean': 0.9598417721518986, 'test_score_std': 0.032128186960552516}, 'fit_time': 2.3157050609588623, 'time_this_iter_s': 15.684244871139526, 'should_checkpoint': True, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 1, 'trial_id': '9dec8_00000', 'experiment_id': 'f8215019c10e4a81ba2187c38e875365', 'date': '2022-06-22_17-27-59', 'timestamp': 1655918879, 'time_total_s': 15.684244871139526, 'pid': 1492629, 'hostname': 'ip-172-31-43-110', 'node_ip': '172.31.43.110', 'config': {}, 'time_since_restore': 15.684244871139526, 'timesteps_since_restore': 0, 'iterations_since_restore': 1, 'warmup_time': 0.0057866573333740234, 'experiment_tag': '0'}\n"
      ]
     }
    ],
@@ -396,7 +350,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 14,
    "id": "24b16ede",
    "metadata": {
     "pycharm": {
@@ -408,8 +362,10 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "Map Progress (1 actors 1 pending): 100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1/1 [00:01<00:00,  1.59s/it]\n",
-      "Map_Batches: 100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1/1 [00:00<00:00, 95.33it/s]"
+      "2022-06-22 17:27:59,658\tWARNING read_api.py:260 -- The number of blocks in this dataset (1) limits its parallelism to 1 concurrent tasks. This is much less than the number of available CPU slots in the cluster. Use `.repartition(n)` to increase the number of dataset blocks.\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 64.73it/s]\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.60s/it]\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 71.41it/s]"
      ]
     },
     {
@@ -417,20 +373,26 @@
      "output_type": "stream",
      "text": [
       "PREDICTED LABELS\n",
-      "     predictions\n",
-      "0              1\n",
-      "1              1\n",
-      "2              1\n",
-      "3              1\n",
-      "4              1\n",
-      "..           ...\n",
-      "166            1\n",
-      "167            1\n",
-      "168            0\n",
-      "169            0\n",
-      "170            1\n",
-      "\n",
-      "[171 rows x 1 columns]\n"
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n"
      ]
     },
     {
@@ -453,7 +415,7 @@
    "notebook_metadata_filter": "-all"
   },
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "Python 3.8.10 ('venv': venv)",
    "language": "python",
    "name": "python3"
   },
@@ -467,9 +429,14 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.7"
+   "version": "3.8.10"
+  },
+  "vscode": {
+   "interpreter": {
+    "hash": "3c0d54d489a08ae47a06eae2fd00ff032d6cddb527c382959b7b2575f6a8167f"
+   }
   }
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
\ No newline at end of file
+}
diff --git a/doc/source/ray-air/examples/upload_to_comet_ml.ipynb b/doc/source/ray-air/examples/upload_to_comet_ml.ipynb
index 934368789a6a..35cfec99eaaa 100644
--- a/doc/source/ray-air/examples/upload_to_comet_ml.ipynb
+++ b/doc/source/ray-air/examples/upload_to_comet_ml.ipynb
@@ -49,8 +49,7 @@
     "from ray.air import RunConfig\n",
     "from ray.air.result import Result\n",
     "from ray.train.xgboost import XGBoostTrainer\n",
-    "from ray.tune.integration.comet import CometLoggerCallback\n",
-    "from sklearn.datasets import load_breast_cancer"
+    "from ray.tune.integration.comet import CometLoggerCallback"
    ]
   },
   {
@@ -69,11 +68,8 @@
    "outputs": [],
    "source": [
     "def get_train_dataset() -> ray.data.Dataset:\n",
-    "    \"\"\"Return the \"Breast cancer\" dataset as a Ray dataset.\"\"\"\n",
-    "    data_raw = load_breast_cancer(as_frame=True)\n",
-    "    df = data_raw[\"data\"]\n",
-    "    df[\"target\"] = data_raw[\"target\"]\n",
-    "    return ray.data.from_pandas(df)"
+    "    dataset = ray.data.read_csv(\"s3://air-example-data/breast_cancer.csv\")\n",
+    "    return dataset"
    ]
   },
   {
diff --git a/doc/source/ray-air/examples/upload_to_wandb.ipynb b/doc/source/ray-air/examples/upload_to_wandb.ipynb
index 48cb51065b5d..58e8463b13da 100644
--- a/doc/source/ray-air/examples/upload_to_wandb.ipynb
+++ b/doc/source/ray-air/examples/upload_to_wandb.ipynb
@@ -49,8 +49,7 @@
     "from ray.air import RunConfig\n",
     "from ray.air.result import Result\n",
     "from ray.train.xgboost import XGBoostTrainer\n",
-    "from ray.tune.integration.wandb import WandbLoggerCallback\n",
-    "from sklearn.datasets import load_breast_cancer"
+    "from ray.tune.integration.wandb import WandbLoggerCallback"
    ]
   },
   {
@@ -69,11 +68,8 @@
    "outputs": [],
    "source": [
     "def get_train_dataset() -> ray.data.Dataset:\n",
-    "    \"\"\"Return the \"Breast cancer\" dataset as a Ray dataset.\"\"\"\n",
-    "    data_raw = load_breast_cancer(as_frame=True)\n",
-    "    df = data_raw[\"data\"]\n",
-    "    df[\"target\"] = data_raw[\"target\"]\n",
-    "    return ray.data.from_pandas(df)"
+    "    dataset = ray.data.read_csv(\"s3://air-example-data/breast_cancer.csv\")\n",
+    "    return dataset"
    ]
   },
   {
diff --git a/doc/source/ray-air/examples/xgboost_example.ipynb b/doc/source/ray-air/examples/xgboost_example.ipynb
index 601bb3db6de6..892647f6d9c3 100644
--- a/doc/source/ray-air/examples/xgboost_example.ipynb
+++ b/doc/source/ray-air/examples/xgboost_example.ipynb
@@ -27,7 +27,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": null,
    "id": "41f20cc1",
    "metadata": {
     "pycharm": {
@@ -53,25 +53,33 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 1,
    "id": "7232303d",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "  from pandas import MultiIndex, Int64Index\n",
+      "FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n"
+     ]
+    }
+   ],
    "source": [
-    "import argparse\n",
     "from typing import Tuple\n",
     "\n",
-    "import pandas as pd\n",
-    "\n",
     "import ray\n",
     "from ray.train.batch_predictor import BatchPredictor\n",
     "from ray.train.xgboost import XGBoostPredictor\n",
     "from ray.train.xgboost import XGBoostTrainer\n",
     "from ray.data.dataset import Dataset\n",
     "from ray.air.result import Result\n",
-    "from ray.data.preprocessors import StandardScaler\n",
-    "from sklearn.datasets import load_breast_cancer\n",
-    "from sklearn.model_selection import train_test_split"
+    "from ray.air.util.datasets import train_test_split\n",
+    "from ray.data.preprocessors import StandardScaler"
    ]
   },
   {
@@ -88,19 +96,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 2,
    "id": "37c4f38f",
    "metadata": {},
    "outputs": [],
    "source": [
     "def prepare_data() -> Tuple[Dataset, Dataset, Dataset]:\n",
-    "    data_raw = load_breast_cancer()\n",
-    "    dataset_df = pd.DataFrame(data_raw[\"data\"], columns=data_raw[\"feature_names\"])\n",
-    "    dataset_df[\"target\"] = data_raw[\"target\"]\n",
-    "    train_df, test_df = train_test_split(dataset_df, test_size=0.3)\n",
-    "    train_dataset = ray.data.from_pandas(train_df)\n",
-    "    valid_dataset = ray.data.from_pandas(test_df)\n",
-    "    test_dataset = ray.data.from_pandas(test_df.drop(\"target\", axis=1))\n",
+    "    dataset = ray.data.read_csv(\"s3://air-example-data/breast_cancer.csv\")\n",
+    "    train_dataset, valid_dataset = train_test_split(dataset, test_size=0.3)\n",
+    "    test_dataset = valid_dataset.map_batches(lambda df: df.drop(\"target\", axis=1), batch_format=\"pandas\")\n",
     "    return train_dataset, valid_dataset, test_dataset"
    ]
   },
@@ -118,7 +122,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 3,
    "id": "dae8998d",
    "metadata": {
     "pycharm": {
@@ -168,7 +172,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 4,
    "id": "5b8076d3",
    "metadata": {
     "pycharm": {
@@ -187,14 +191,13 @@
     "    predicted_labels = (\n",
     "        batch_predictor.predict(test_dataset)\n",
     "        .map_batches(lambda df: (df > 0.5).astype(int), batch_format=\"pandas\")\n",
-    "        .to_pandas(limit=float(\"inf\"))\n",
     "    )\n",
-    "    print(f\"PREDICTED LABELS\\n{predicted_labels}\")\n",
+    "    print(f\"PREDICTED LABELS\")\n",
+    "    predicted_labels.show()\n",
     "\n",
-    "    shap_values = batch_predictor.predict(test_dataset, pred_contribs=True).to_pandas(\n",
-    "        limit=float(\"inf\")\n",
-    "    )\n",
-    "    print(f\"SHAP VALUES\\n{shap_values}\")\n"
+    "    shap_values = batch_predictor.predict(test_dataset, pred_contribs=True)\n",
+    "    print(f\"SHAP VALUES\")\n",
+    "    shap_values.show()\n"
    ]
   },
   {
@@ -207,7 +210,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 5,
    "id": "0f96d62b",
    "metadata": {
     "pycharm": {
@@ -219,18 +222,20 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-19 11:44:42,413\tINFO services.py:1483 -- View the Ray dashboard at \u001B[1m\u001B[32mhttp://127.0.0.1:8265\u001B[39m\u001B[22m\n"
+      "2022-06-22 17:28:55,841\tINFO services.py:1477 -- View the Ray dashboard at \u001b[1m\u001b[32mhttp://127.0.0.1:8270\u001b[39m\u001b[22m\n",
+      "2022-06-22 17:28:58,044\tWARNING read_api.py:260 -- The number of blocks in this dataset (1) limits its parallelism to 1 concurrent tasks. This is much less than the number of available CPU slots in the cluster. Use `.repartition(n)` to increase the number of dataset blocks.\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 40.28it/s]\n"
      ]
     },
     {
      "data": {
       "text/html": [
-       "== Status ==<br>Current time: 2022-05-19 11:45:00 (running for 00:00:13.93)<br>Memory usage on this node: 10.3/16.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/16 CPUs, 0/0 GPUs, 0.0/4.5 GiB heap, 0.0/2.0 GiB objects<br>Result logdir: /Users/kai/ray_results/XGBoostTrainer_2022-05-19_11-44-45<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
+       "== Status ==<br>Current time: 2022-06-22 17:29:15 (running for 00:00:16.11)<br>Memory usage on this node: 11.5/31.0 GiB<br>Using FIFO scheduling algorithm.<br>Resources requested: 0/8 CPUs, 0/0 GPUs, 0.0/12.35 GiB heap, 0.0/6.18 GiB objects<br>Result logdir: /home/ubuntu/ray_results/XGBoostTrainer_2022-06-22_17-28-58<br>Number of trials: 1/1 (1 TERMINATED)<br><table>\n",
        "<thead>\n",
-       "<tr><th>Trial name                </th><th>status    </th><th>loc            </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">  train-logloss</th><th style=\"text-align: right;\">  train-error</th><th style=\"text-align: right;\">  valid-logloss</th></tr>\n",
+       "<tr><th>Trial name                </th><th>status    </th><th>loc                  </th><th style=\"text-align: right;\">  iter</th><th style=\"text-align: right;\">  total time (s)</th><th style=\"text-align: right;\">  train-logloss</th><th style=\"text-align: right;\">  train-error</th><th style=\"text-align: right;\">  valid-logloss</th></tr>\n",
        "</thead>\n",
        "<tbody>\n",
-       "<tr><td>XGBoostTrainer_b273b_00000</td><td>TERMINATED</td><td>127.0.0.1:11036</td><td style=\"text-align: right;\">   100</td><td style=\"text-align: right;\">         9.03935</td><td style=\"text-align: right;\">       0.005949</td><td style=\"text-align: right;\">            0</td><td style=\"text-align: right;\">        0.07483</td></tr>\n",
+       "<tr><td>XGBoostTrainer_cc863_00000</td><td>TERMINATED</td><td>172.31.43.110:1493910</td><td style=\"text-align: right;\">   100</td><td style=\"text-align: right;\">         12.5164</td><td style=\"text-align: right;\">       0.005874</td><td style=\"text-align: right;\">            0</td><td style=\"text-align: right;\">       0.078188</td></tr>\n",
        "</tbody>\n",
        "</table><br><br>"
       ],
@@ -245,47 +250,68 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:44:47,554\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=54067 --object-store-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=61242 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:61017 --redis-password=5241590000000000 --startup-token=16 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:44:51,603\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=54067 --object-store-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=61242 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:61017 --redis-password=5241590000000000 --startup-token=17 --runtime-env-hash=-2010331069\n",
-      "\u001B[2m\u001B[36m(GBDTTrainable pid=11036)\u001B[0m UserWarning: Dataset 'train' has 1 blocks, which is less than the `num_workers` 2. This dataset will be automatically repartitioned to 2 blocks.\n",
-      "\u001B[2m\u001B[36m(GBDTTrainable pid=11036)\u001B[0m UserWarning: Dataset 'valid' has 1 blocks, which is less than the `num_workers` 2. This dataset will be automatically repartitioned to 2 blocks.\n",
-      "\u001B[2m\u001B[36m(GBDTTrainable pid=11036)\u001B[0m 2022-05-19 11:44:53,035\tINFO main.py:980 -- [RayXGBoost] Created 2 new actors (2 total actors). Waiting until actors are ready for training.\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:44:54,085\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=54067 --object-store-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=61242 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:61017 --redis-password=5241590000000000 --startup-token=18 --runtime-env-hash=-2010331069\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:44:54,106\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=54067 --object-store-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=61242 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:61017 --redis-password=5241590000000000 --startup-token=19 --runtime-env-hash=-2010331069\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:44:54,252\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=54067 --object-store-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=61242 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:61017 --redis-password=5241590000000000 --startup-token=21 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:44:54,266\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=54067 --object-store-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=61242 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:61017 --redis-password=5241590000000000 --startup-token=23 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:44:54,266\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=54067 --object-store-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=61242 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:61017 --redis-password=5241590000000000 --startup-token=20 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[33m(raylet)\u001B[0m 2022-05-19 11:44:54,271\tINFO context.py:70 -- Exec'ing worker with command: exec /Users/kai/.pyenv/versions/3.7.7/bin/python3.7 /Users/kai/coding/ray/python/ray/workers/default_worker.py --node-ip-address=127.0.0.1 --node-manager-port=54067 --object-store-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/plasma_store --raylet-name=/tmp/ray/session_2022-05-19_11-44-39_813259_10959/sockets/raylet --redis-address=None --storage=None --temp-dir=/tmp/ray --metrics-agent-port=61242 --logging-rotate-bytes=536870912 --logging-rotate-backup-count=5 --gcs-address=127.0.0.1:61017 --redis-password=5241590000000000 --startup-token=22 --runtime-env-hash=-2010331134\n",
-      "\u001B[2m\u001B[36m(GBDTTrainable pid=11036)\u001B[0m 2022-05-19 11:44:56,874\tINFO main.py:1025 -- [RayXGBoost] Starting XGBoost training.\n",
-      "\u001B[2m\u001B[36m(_RemoteRayXGBoostActor pid=11104)\u001B[0m [11:44:56] task [xgboost.ray]:4517180944 got new rank 1\n",
-      "\u001B[2m\u001B[36m(_RemoteRayXGBoostActor pid=11103)\u001B[0m [11:44:56] task [xgboost.ray]:4655847056 got new rank 0\n"
+      "\u001b[2m\u001b[36m(pid=1493910)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1493910)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1493910)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1493910)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1493910)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(XGBoostTrainer pid=1493910)\u001b[0m UserWarning: Dataset 'train' has 1 blocks, which is less than the `num_workers` 2. This dataset will be automatically repartitioned to 2 blocks.\n",
+      "\u001b[2m\u001b[36m(XGBoostTrainer pid=1493910)\u001b[0m UserWarning: Dataset 'valid' has 1 blocks, which is less than the `num_workers` 2. This dataset will be automatically repartitioned to 2 blocks.\n",
+      "\u001b[2m\u001b[36m(XGBoostTrainer pid=1493910)\u001b[0m 2022-06-22 17:29:04,073\tINFO main.py:980 -- [RayXGBoost] Created 2 new actors (2 total actors). Waiting until actors are ready for training.\n",
+      "\u001b[2m\u001b[36m(pid=1494007)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494007)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1494008)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494008)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1494009)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494009)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1494007)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494007)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494007)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494008)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494008)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494008)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_RemoteRayXGBoostActor pid=1494008)\u001b[0m 2022-06-22 17:29:07,324\tWARNING __init__.py:190 -- DeprecationWarning: `ray.worker.get_resource_ids` is a private attribute and access will be removed in a future Ray version.\n",
+      "\u001b[2m\u001b[36m(pid=1494009)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494009)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494009)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_RemoteRayXGBoostActor pid=1494009)\u001b[0m 2022-06-22 17:29:07,421\tWARNING __init__.py:190 -- DeprecationWarning: `ray.worker.get_resource_ids` is a private attribute and access will be removed in a future Ray version.\n",
+      "\u001b[2m\u001b[36m(XGBoostTrainer pid=1493910)\u001b[0m 2022-06-22 17:29:07,874\tINFO main.py:1025 -- [RayXGBoost] Starting XGBoost training.\n",
+      "\u001b[2m\u001b[36m(_RemoteRayXGBoostActor pid=1494008)\u001b[0m [17:29:07] task [xgboost.ray]:139731353900128 got new rank 0\n",
+      "\u001b[2m\u001b[36m(_RemoteRayXGBoostActor pid=1494008)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_RemoteRayXGBoostActor pid=1494009)\u001b[0m [17:29:07] task [xgboost.ray]:140076138558608 got new rank 1\n",
+      "\u001b[2m\u001b[36m(_RemoteRayXGBoostActor pid=1494009)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1494006)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1494006)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1494006)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1494006)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(_QueueActor pid=1494006)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Result for XGBoostTrainer_b273b_00000:\n",
-      "  date: 2022-05-19_11-44-57\n",
+      "Result for XGBoostTrainer_cc863_00000:\n",
+      "  date: 2022-06-22_17-29-09\n",
       "  done: false\n",
-      "  experiment_id: 991235d8b76649398688695ca70a08e4\n",
-      "  hostname: Kais-MacBook-Pro.local\n",
+      "  experiment_id: dc3dac01a34043cfb5751907e2bc648e\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 1\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 11036\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1493910\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 7.17207407951355\n",
-      "  time_this_iter_s: 7.17207407951355\n",
-      "  time_total_s: 7.17207407951355\n",
-      "  timestamp: 1652957097\n",
+      "  time_since_restore: 7.967940330505371\n",
+      "  time_this_iter_s: 7.967940330505371\n",
+      "  time_total_s: 7.967940330505371\n",
+      "  timestamp: 1655918949\n",
       "  timesteps_since_restore: 0\n",
-      "  train-error: 0.020101\n",
-      "  train-logloss: 0.465715\n",
+      "  train-error: 0.017588\n",
+      "  train-logloss: 0.464648\n",
       "  training_iteration: 1\n",
-      "  trial_id: b273b_00000\n",
-      "  valid-error: 0.052632\n",
-      "  valid-logloss: 0.480831\n",
-      "  warmup_time: 0.003935098648071289\n",
+      "  trial_id: cc863_00000\n",
+      "  valid-error: 0.081871\n",
+      "  valid-logloss: 0.496374\n",
+      "  warmup_time: 0.004768848419189453\n",
       "  \n"
      ]
     },
@@ -293,35 +319,35 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "\u001B[2m\u001B[36m(GBDTTrainable pid=11036)\u001B[0m 2022-05-19 11:44:59,796\tINFO main.py:1519 -- [RayXGBoost] Finished XGBoost training on training data with total N=398 in 6.80 seconds (2.92 pure XGBoost training time).\n"
+      "\u001b[2m\u001b[36m(XGBoostTrainer pid=1493910)\u001b[0m 2022-06-22 17:29:14,546\tINFO main.py:1516 -- [RayXGBoost] Finished XGBoost training on training data with total N=398 in 10.52 seconds (6.66 pure XGBoost training time).\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Result for XGBoostTrainer_b273b_00000:\n",
-      "  date: 2022-05-19_11-44-59\n",
+      "Result for XGBoostTrainer_cc863_00000:\n",
+      "  date: 2022-06-22_17-29-14\n",
       "  done: true\n",
-      "  experiment_id: 991235d8b76649398688695ca70a08e4\n",
+      "  experiment_id: dc3dac01a34043cfb5751907e2bc648e\n",
       "  experiment_tag: '0'\n",
-      "  hostname: Kais-MacBook-Pro.local\n",
+      "  hostname: ip-172-31-43-110\n",
       "  iterations_since_restore: 100\n",
-      "  node_ip: 127.0.0.1\n",
-      "  pid: 11036\n",
+      "  node_ip: 172.31.43.110\n",
+      "  pid: 1493910\n",
       "  should_checkpoint: true\n",
-      "  time_since_restore: 9.03934907913208\n",
-      "  time_this_iter_s: 0.018042802810668945\n",
-      "  time_total_s: 9.03934907913208\n",
-      "  timestamp: 1652957099\n",
+      "  time_since_restore: 12.516392230987549\n",
+      "  time_this_iter_s: 0.03008890151977539\n",
+      "  time_total_s: 12.516392230987549\n",
+      "  timestamp: 1655918954\n",
       "  timesteps_since_restore: 0\n",
       "  train-error: 0.0\n",
-      "  train-logloss: 0.005949\n",
+      "  train-logloss: 0.005874\n",
       "  training_iteration: 100\n",
-      "  trial_id: b273b_00000\n",
-      "  valid-error: 0.017544\n",
-      "  valid-logloss: 0.07483\n",
-      "  warmup_time: 0.003935098648071289\n",
+      "  trial_id: cc863_00000\n",
+      "  valid-error: 0.040936\n",
+      "  valid-logloss: 0.078188\n",
+      "  warmup_time: 0.004768848419189453\n",
       "  \n"
      ]
     },
@@ -329,14 +355,14 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "2022-05-19 11:45:00,535\tINFO tune.py:753 -- Total run time: 15.30 seconds (13.91 seconds for the tuning loop).\n"
+      "2022-06-22 17:29:15,362\tINFO tune.py:734 -- Total run time: 16.94 seconds (16.08 seconds for the tuning loop).\n"
      ]
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "{'train-logloss': 0.005949, 'train-error': 0.0, 'valid-logloss': 0.07483, 'valid-error': 0.017544, 'time_this_iter_s': 0.018042802810668945, 'should_checkpoint': True, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 100, 'trial_id': 'b273b_00000', 'experiment_id': '991235d8b76649398688695ca70a08e4', 'date': '2022-05-19_11-44-59', 'timestamp': 1652957099, 'time_total_s': 9.03934907913208, 'pid': 11036, 'hostname': 'Kais-MacBook-Pro.local', 'node_ip': '127.0.0.1', 'config': {}, 'time_since_restore': 9.03934907913208, 'timesteps_since_restore': 0, 'iterations_since_restore': 100, 'warmup_time': 0.003935098648071289, 'experiment_tag': '0'}\n"
+      "{'train-logloss': 0.005874, 'train-error': 0.0, 'valid-logloss': 0.078188, 'valid-error': 0.040936, 'time_this_iter_s': 0.03008890151977539, 'should_checkpoint': True, 'done': True, 'timesteps_total': None, 'episodes_total': None, 'training_iteration': 100, 'trial_id': 'cc863_00000', 'experiment_id': 'dc3dac01a34043cfb5751907e2bc648e', 'date': '2022-06-22_17-29-14', 'timestamp': 1655918954, 'time_total_s': 12.516392230987549, 'pid': 1493910, 'hostname': 'ip-172-31-43-110', 'node_ip': '172.31.43.110', 'config': {}, 'time_since_restore': 12.516392230987549, 'timesteps_since_restore': 0, 'iterations_since_restore': 100, 'warmup_time': 0.004768848419189453, 'experiment_tag': '0'}\n"
      ]
     }
    ],
@@ -354,7 +380,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 6,
    "id": "283b1dba",
    "metadata": {
     "pycharm": {
@@ -366,8 +392,16 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "Map Progress (1 actors 1 pending): 100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1/1 [00:01<00:00,  1.96s/it]\n",
-      "Map_Batches: 100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1/1 [00:00<00:00, 87.81it/s]\n"
+      "2022-06-22 17:29:16,463\tWARNING read_api.py:260 -- The number of blocks in this dataset (1) limits its parallelism to 1 concurrent tasks. This is much less than the number of available CPU slots in the cluster. Use `.repartition(n)` to increase the number of dataset blocks.\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 46.14it/s]\n",
+      "Map_Batches:   0%|          | 0/1 [00:00<?, ?it/s]\u001b[2m\u001b[36m(pid=1494373)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494373)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1494373)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494373)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494373)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.90s/it]\n",
+      "\u001b[2m\u001b[36m(BlockWorker pid=1494373)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "Map_Batches: 100%|██████████| 1/1 [00:00<00:00, 75.10it/s]\n"
      ]
     },
     {
@@ -375,27 +409,43 @@
      "output_type": "stream",
      "text": [
       "PREDICTED LABELS\n",
-      "     predictions\n",
-      "0              0\n",
-      "1              0\n",
-      "2              1\n",
-      "3              1\n",
-      "4              0\n",
-      "..           ...\n",
-      "166            1\n",
-      "167            1\n",
-      "168            0\n",
-      "169            1\n",
-      "170            0\n",
-      "\n",
-      "[171 rows x 1 columns]\n"
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 0}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 1}\n",
+      "{'predictions': 0}\n"
      ]
     },
     {
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "Map Progress (1 actors 1 pending): 100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1/1 [00:01<00:00,  1.78s/it]"
+      "Map_Batches:   0%|          | 0/1 [00:00<?, ?it/s]\u001b[2m\u001b[36m(pid=1494403)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494403)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1494413)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494413)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1494403)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494403)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494403)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494413)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494413)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494413)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "Map Progress (1 actors 1 pending): 100%|██████████| 1/1 [00:01<00:00,  1.88s/it]"
      ]
     },
     {
@@ -403,72 +453,26 @@
      "output_type": "stream",
      "text": [
       "SHAP VALUES\n",
-      "     predictions_0  predictions_1  predictions_2  predictions_3  \\\n",
-      "0        -0.139882      -0.748878            0.0      -1.143079   \n",
-      "1         0.013840      -1.053747            0.0       0.361219   \n",
-      "2        -0.082575       0.952107            0.0       0.396908   \n",
-      "3         0.016314       0.916166            0.0       0.535740   \n",
-      "4        -0.087534       1.317693            0.0      -0.631737   \n",
-      "..             ...            ...            ...            ...   \n",
-      "166       0.016314       1.006091            0.0       0.535740   \n",
-      "167       0.010002       0.948294            0.0       0.529942   \n",
-      "168      -0.084481       0.766085            0.0      -0.582221   \n",
-      "169       0.010002       0.846374            0.0       0.502846   \n",
-      "170      -0.108186      -1.032712            0.0      -0.737255   \n",
-      "\n",
-      "     predictions_4  predictions_5  predictions_6  predictions_7  \\\n",
-      "0         0.228545       0.074653      -0.033109      -1.680274   \n",
-      "1        -0.386373       0.030964      -0.026341      -1.796480   \n",
-      "2         0.294464       0.142708       0.151952       1.859482   \n",
-      "3         0.224681      -0.013640       0.062032       0.909347   \n",
-      "4        -0.123310      -0.008267      -0.081633      -1.907682   \n",
-      "..             ...            ...            ...            ...   \n",
-      "166       0.224681      -0.013640       0.062032       0.890978   \n",
-      "167      -0.107441       0.143260       0.062032       1.149335   \n",
-      "168      -0.164466       0.088426      -0.081633      -1.767637   \n",
-      "169      -0.112530       0.029944      -0.074865       0.963479   \n",
-      "170      -0.250381       0.034186      -0.033109      -1.654185   \n",
-      "\n",
-      "     predictions_8  predictions_9  ...  predictions_21  predictions_22  \\\n",
-      "0        -0.173504      -0.027610  ...       -0.373735       -1.117443   \n",
-      "1         0.153518       0.018295  ...       -0.798841        0.277471   \n",
-      "2         0.153518       0.029338  ...        1.314059       -0.455756   \n",
-      "3         0.153518       0.015659  ...        0.816392        0.683619   \n",
-      "4        -0.173504       0.009200  ...        1.207632       -0.945986   \n",
-      "..             ...            ...  ...             ...             ...   \n",
-      "166      -0.173504       0.015659  ...        0.856858        0.704448   \n",
-      "167       0.153518       0.010089  ...        1.203512        0.708437   \n",
-      "168       0.153518       0.014880  ...       -0.418931       -1.201489   \n",
-      "169       0.153518       0.010089  ...        1.211174        0.600757   \n",
-      "170       0.153518       0.016329  ...       -0.556651       -1.009517   \n",
-      "\n",
-      "     predictions_23  predictions_24  predictions_25  predictions_26  \\\n",
-      "0         -1.207984        0.349734        0.018222       -0.725013   \n",
-      "1          0.075934       -0.990557       -0.012509       -0.863824   \n",
-      "2          0.137665        0.668639       -0.042249       -0.684045   \n",
-      "3          0.766776        0.575949        0.022816        1.013024   \n",
-      "4         -0.577419       -0.454616        0.051755       -0.861906   \n",
-      "..              ...             ...             ...             ...   \n",
-      "166        0.754576        0.573718        0.022816        0.948516   \n",
-      "167        1.066871        0.487933        0.056155       -0.601421   \n",
-      "168       -1.310177       -0.386367        0.018222       -0.837832   \n",
-      "169        1.009837        0.694783       -0.042249       -0.626939   \n",
-      "170       -1.149971       -0.386467       -0.006737       -0.750287   \n",
-      "\n",
-      "     predictions_27  predictions_28  predictions_29  predictions_30  \n",
-      "0         -1.149301        0.374839             0.0        1.046286  \n",
-      "1         -2.501725       -0.492608             0.0        1.046286  \n",
-      "2          0.077563       -0.106669             0.0        1.046286  \n",
-      "3          0.757272        0.341423             0.0        1.046286  \n",
-      "4         -0.800213        0.400311             0.0        1.046286  \n",
-      "..              ...             ...             ...             ...  \n",
-      "166        0.757272        0.061695             0.0        1.046286  \n",
-      "167        0.610080       -0.339797             0.0        1.046286  \n",
-      "168       -1.300907       -0.474622             0.0        1.046286  \n",
-      "169        0.238948       -0.361304             0.0        1.046286  \n",
-      "170       -1.241549       -0.370570             0.0        1.046286  \n",
-      "\n",
-      "[171 rows x 31 columns]\n"
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.546318531036377, 'predictions_2': -0.006533853709697723, 'predictions_3': 0.022934239357709885, 'predictions_4': 0.32817941904067993, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.013881205581128597, 'predictions_7': 0.568859875202179, 'predictions_8': -0.27460771799087524, 'predictions_9': 0.013218197971582413, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.04015672579407692, 'predictions_12': 0.11667086184024811, 'predictions_13': 0.9853533506393433, 'predictions_14': 0.05529181659221649, 'predictions_15': -0.005734208971261978, 'predictions_16': -0.0008497871458530426, 'predictions_17': 0.16138489544391632, 'predictions_18': -0.36162295937538147, 'predictions_19': 0.003658014815300703, 'predictions_20': 0.393682062625885, 'predictions_21': 0.6647266149520874, 'predictions_22': 1.7201099395751953, 'predictions_23': 0.35084351897239685, 'predictions_24': 0.4841834604740143, 'predictions_25': 0.013311417773365974, 'predictions_26': 0.8087116479873657, 'predictions_27': 0.5730299353599548, 'predictions_28': 0.1818174123764038, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.39265793561935425, 'predictions_2': -0.007271876558661461, 'predictions_3': 0.022934239357709885, 'predictions_4': -0.06737710535526276, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.7946916222572327, 'predictions_8': 0.30412089824676514, 'predictions_9': 0.013218197971582413, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.04129280149936676, 'predictions_12': -0.012254374101758003, 'predictions_13': 0.2327558547258377, 'predictions_14': 0.05529181659221649, 'predictions_15': 0.6405980587005615, 'predictions_16': -0.0014769809786230326, 'predictions_17': 0.16138489544391632, 'predictions_18': -0.3877210319042206, 'predictions_19': -0.0022315792739391327, 'predictions_20': 0.3209536671638489, 'predictions_21': -0.018735788762569427, 'predictions_22': 1.482913851737976, 'predictions_23': 0.3135913908481598, 'predictions_24': 0.5150958299636841, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.0875523090362549, 'predictions_27': 0.7323897480964661, 'predictions_28': 0.12313760071992874, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': -0.01911582238972187, 'predictions_1': -0.41554388403892517, 'predictions_2': -0.0034923271741718054, 'predictions_3': -0.06306137144565582, 'predictions_4': -0.3192429542541504, 'predictions_5': -0.009094981476664543, 'predictions_6': -0.08258295059204102, 'predictions_7': -0.8088644742965698, 'predictions_8': 0.2545676529407501, 'predictions_9': 0.015295587480068207, 'predictions_10': 0.0021318818908184767, 'predictions_11': -0.003732672892510891, 'predictions_12': -0.054907385259866714, 'predictions_13': -0.9062053561210632, 'predictions_14': -0.029618918895721436, 'predictions_15': 0.4303477704524994, 'predictions_16': -0.007885736413300037, 'predictions_17': 0.17541413009166718, 'predictions_18': -0.3190936744213104, 'predictions_19': 0.0024438181426376104, 'predictions_20': -0.6092430353164673, 'predictions_21': -0.3519248068332672, 'predictions_22': -2.2588469982147217, 'predictions_23': -0.569831371307373, 'predictions_24': -1.0422284603118896, 'predictions_25': -0.031086977571249008, 'predictions_26': -0.5648106932640076, 'predictions_27': -1.0225528478622437, 'predictions_28': -0.1411924958229065, 'predictions_29': -0.1724514663219452, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.5999099016189575, 'predictions_2': -0.007271876558661461, 'predictions_3': 0.022934239357709885, 'predictions_4': 0.31011122465133667, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.013881205581128597, 'predictions_7': 0.5183905363082886, 'predictions_8': -0.27460771799087524, 'predictions_9': -0.015900276601314545, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.04129280149936676, 'predictions_12': 0.11667086184024811, 'predictions_13': 1.0816324949264526, 'predictions_14': -0.01614229381084442, 'predictions_15': -0.23922261595726013, 'predictions_16': -0.0008497871458530426, 'predictions_17': 0.16138489544391632, 'predictions_18': -0.36162295937538147, 'predictions_19': -0.0022315792739391327, 'predictions_20': 0.3189953863620758, 'predictions_21': 0.6754519939422607, 'predictions_22': 1.513157606124878, 'predictions_23': 0.35084351897239685, 'predictions_24': 0.09065212309360504, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.039388656616211, 'predictions_27': 0.5762963891029358, 'predictions_28': 0.1816803514957428, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.41290122270584106, 'predictions_2': -0.007271876558661461, 'predictions_3': 0.04113232344388962, 'predictions_4': 0.4761468768119812, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.6889638304710388, 'predictions_8': 0.30412089824676514, 'predictions_9': -0.00703495554625988, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.04129280149936676, 'predictions_12': -0.012254374101758003, 'predictions_13': 0.8955986499786377, 'predictions_14': 0.05529181659221649, 'predictions_15': 0.6405980587005615, 'predictions_16': -0.0010774275287985802, 'predictions_17': 0.16581103205680847, 'predictions_18': 0.4200459420681, 'predictions_19': 0.003658014815300703, 'predictions_20': 0.31559276580810547, 'predictions_21': 0.08991634845733643, 'predictions_22': 1.374340295791626, 'predictions_23': 0.4179628789424896, 'predictions_24': 0.6432731747627258, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.0250954627990723, 'predictions_27': 0.6740144491195679, 'predictions_28': -0.12222569435834885, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.6223654747009277, 'predictions_2': -0.007271876558661461, 'predictions_3': 0.04113232344388962, 'predictions_4': 0.030091704800724983, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.520163893699646, 'predictions_8': -0.13476626574993134, 'predictions_9': 0.013218197971582413, 'predictions_10': 0.004969821777194738, 'predictions_11': 0.04129280149936676, 'predictions_12': 0.11667086184024811, 'predictions_13': 1.0668600797653198, 'predictions_14': -0.46553897857666016, 'predictions_15': -0.06545835733413696, 'predictions_16': -0.0010774275287985802, 'predictions_17': 0.16138489544391632, 'predictions_18': 0.406240850687027, 'predictions_19': -0.004930071532726288, 'predictions_20': 0.303047239780426, 'predictions_21': 0.7582043409347534, 'predictions_22': 1.4096102714538574, 'predictions_23': 0.43191614747047424, 'predictions_24': 0.47695621848106384, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.0482016801834106, 'predictions_27': 0.5110929608345032, 'predictions_28': -0.12222569435834885, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.5661754012107849, 'predictions_2': -0.0019909553229808807, 'predictions_3': 0.04113232344388962, 'predictions_4': 0.292957067489624, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.013881205581128597, 'predictions_7': 0.6406195759773254, 'predictions_8': -0.27460771799087524, 'predictions_9': -0.007835762575268745, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.04129280149936676, 'predictions_12': -0.012254374101758003, 'predictions_13': 0.21169273555278778, 'predictions_14': -0.02233714796602726, 'predictions_15': -0.9655348658561707, 'predictions_16': -0.0010828523663803935, 'predictions_17': 0.16581103205680847, 'predictions_18': 0.4200459420681, 'predictions_19': -0.0022315792739391327, 'predictions_20': 0.3136344850063324, 'predictions_21': 0.7264875173568726, 'predictions_22': 1.5534507036209106, 'predictions_23': 0.41967567801475525, 'predictions_24': 0.41908225417137146, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.0032241344451904, 'predictions_27': 0.6091798543930054, 'predictions_28': 0.18174558877944946, 'predictions_29': 0.08268986642360687, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.40430790185928345, 'predictions_2': -0.007271876558661461, 'predictions_3': 0.04113232344388962, 'predictions_4': -0.33117765188217163, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.013881205581128597, 'predictions_7': 0.737379252910614, 'predictions_8': -0.27460771799087524, 'predictions_9': 0.007771771401166916, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.04129280149936676, 'predictions_12': -0.012254374101758003, 'predictions_13': 0.18173672258853912, 'predictions_14': -0.02233714796602726, 'predictions_15': 0.6811268329620361, 'predictions_16': -0.0014769809786230326, 'predictions_17': 0.16581103205680847, 'predictions_18': 0.406240850687027, 'predictions_19': -0.0022315792739391327, 'predictions_20': 0.31559276580810547, 'predictions_21': -0.031238339841365814, 'predictions_22': 1.7573171854019165, 'predictions_23': 0.3838556110858917, 'predictions_24': 0.14492939412593842, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.1148661375045776, 'predictions_27': 0.7173758149147034, 'predictions_28': 0.18174558877944946, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': -0.11485510319471359, 'predictions_1': 0.8875605463981628, 'predictions_2': -0.05685592442750931, 'predictions_3': -0.06306137144565582, 'predictions_4': 0.013515152037143707, 'predictions_5': 0.0024520084261894226, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.4688224792480469, 'predictions_8': -0.14307911694049835, 'predictions_9': -0.06901921331882477, 'predictions_10': 0.003290211781859398, 'predictions_11': 0.003781725186854601, 'predictions_12': 0.08078579604625702, 'predictions_13': 0.8216619491577148, 'predictions_14': 0.0463210791349411, 'predictions_15': -0.13255546987056732, 'predictions_16': -0.0010776874842122197, 'predictions_17': 0.21504947543144226, 'predictions_18': -0.27619078755378723, 'predictions_19': -0.0025743553414940834, 'predictions_20': -0.9275118112564087, 'predictions_21': 1.0307989120483398, 'predictions_22': -2.7721312046051025, 'predictions_23': -0.4765593707561493, 'predictions_24': 0.5464398264884949, 'predictions_25': 0.004862718749791384, 'predictions_26': -0.619586706161499, 'predictions_27': -0.2188473790884018, 'predictions_28': 0.10512445122003555, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.0011090459302067757, 'predictions_1': -0.5595121383666992, 'predictions_2': -0.002613282995298505, 'predictions_3': 0.04113232344388962, 'predictions_4': 0.5254822969436646, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.013881205581128597, 'predictions_7': 0.5551156997680664, 'predictions_8': -0.27460771799087524, 'predictions_9': 0.013218197971582413, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.03278094530105591, 'predictions_12': -0.012305313721299171, 'predictions_13': -1.6061651706695557, 'predictions_14': -0.01887715980410576, 'predictions_15': 0.6405980587005615, 'predictions_16': -0.0014769809786230326, 'predictions_17': -0.1776299774646759, 'predictions_18': 0.4914793074131012, 'predictions_19': 0.014222224242985249, 'predictions_20': 0.311679869890213, 'predictions_21': -0.08892179280519485, 'predictions_22': 1.5504939556121826, 'predictions_23': 0.5073927044868469, 'predictions_24': 0.6315706968307495, 'predictions_25': 0.005095706321299076, 'predictions_26': 0.7821602821350098, 'predictions_27': 0.7409825325012207, 'predictions_28': 0.1818174123764038, 'predictions_29': 0.07541733235120773, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': -0.01911582238972187, 'predictions_1': -0.41529545187950134, 'predictions_2': -0.0034923271741718054, 'predictions_3': -0.06306137144565582, 'predictions_4': -0.3192429542541504, 'predictions_5': 0.0166567862033844, 'predictions_6': -0.08258295059204102, 'predictions_7': -0.8088644742965698, 'predictions_8': 0.2545676529407501, 'predictions_9': 0.015658268705010414, 'predictions_10': 0.0021318818908184767, 'predictions_11': -0.003732672892510891, 'predictions_12': -0.054124802350997925, 'predictions_13': -1.0786054134368896, 'predictions_14': -0.03029802441596985, 'predictions_15': 0.46246394515037537, 'predictions_16': -0.007885736413300037, 'predictions_17': -0.168026864528656, 'predictions_18': -0.3190936744213104, 'predictions_19': 0.0024438181426376104, 'predictions_20': -0.6661943197250366, 'predictions_21': -0.2179996222257614, 'predictions_22': -2.689664125442505, 'predictions_23': -0.569831371307373, 'predictions_24': -0.6587631106376648, 'predictions_25': -0.031086977571249008, 'predictions_26': -0.554345428943634, 'predictions_27': -0.9785504937171936, 'predictions_28': -0.14026358723640442, 'predictions_29': 0.08221252262592316, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.46925264596939087, 'predictions_2': -0.007271876558661461, 'predictions_3': 0.04113232344388962, 'predictions_4': 0.49770334362983704, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.7922263741493225, 'predictions_8': 0.30412089824676514, 'predictions_9': -0.020953189581632614, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.04129280149936676, 'predictions_12': 0.10843253135681152, 'predictions_13': 0.21460701525211334, 'predictions_14': -0.01614229381084442, 'predictions_15': 0.6405980587005615, 'predictions_16': -0.0014769809786230326, 'predictions_17': 0.16581103205680847, 'predictions_18': 0.4200459420681, 'predictions_19': -0.004930071532726288, 'predictions_20': 0.31877532601356506, 'predictions_21': -0.01986948773264885, 'predictions_22': 1.556177020072937, 'predictions_23': 0.445791631937027, 'predictions_24': 0.5183241367340088, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.139808177947998, 'predictions_27': 0.5462087988853455, 'predictions_28': -0.12236276268959045, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.4225478768348694, 'predictions_2': -0.007271876558661461, 'predictions_3': 0.022934239357709885, 'predictions_4': 0.38781455159187317, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.013881205581128597, 'predictions_7': 0.6254116892814636, 'predictions_8': -0.28174325823783875, 'predictions_9': 0.008572578430175781, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.022453438490629196, 'predictions_12': 0.09116627275943756, 'predictions_13': 1.01081383228302, 'predictions_14': 0.051560889929533005, 'predictions_15': -0.7526140809059143, 'predictions_16': -0.0010774275287985802, 'predictions_17': 0.13414263725280762, 'predictions_18': -0.36162295937538147, 'predictions_19': -0.004930071532726288, 'predictions_20': 0.21481025218963623, 'predictions_21': -1.7817566394805908, 'predictions_22': 1.5544458627700806, 'predictions_23': 0.37933894991874695, 'predictions_24': -0.5005015134811401, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.2116931676864624, 'predictions_27': 0.44261839985847473, 'predictions_28': -0.1333807408809662, 'predictions_29': 0.12356309592723846, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': 0.383541464805603, 'predictions_2': -0.007271876558661461, 'predictions_3': 0.022934239357709885, 'predictions_4': -0.2877747118473053, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.7181150317192078, 'predictions_8': -0.13476626574993134, 'predictions_9': 0.008572578430175781, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.04129280149936676, 'predictions_12': 0.11661991477012634, 'predictions_13': 1.1911046504974365, 'predictions_14': 0.05529181659221649, 'predictions_15': -0.9263618588447571, 'predictions_16': -0.0010774275287985802, 'predictions_17': 0.16138489544391632, 'predictions_18': -0.3877210319042206, 'predictions_19': -0.0022315792739391327, 'predictions_20': 0.33373206853866577, 'predictions_21': -0.10588698834180832, 'predictions_22': 1.7216718196868896, 'predictions_23': 0.33134832978248596, 'predictions_24': 0.07947567105293274, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.1455278396606445, 'predictions_27': 0.6355651617050171, 'predictions_28': -0.12222569435834885, 'predictions_29': 0.08268986642360687, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.0006543132476508617, 'predictions_1': -0.9144008159637451, 'predictions_2': -0.002613282995298505, 'predictions_3': 0.04113232344388962, 'predictions_4': 0.3871055543422699, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.013881205581128597, 'predictions_7': 0.6403470635414124, 'predictions_8': -0.27460771799087524, 'predictions_9': 0.05645249783992767, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.02168312668800354, 'predictions_12': 0.11661991477012634, 'predictions_13': 1.00325608253479, 'predictions_14': 0.0834161564707756, 'predictions_15': 0.6231592893600464, 'predictions_16': -0.0010774275287985802, 'predictions_17': 0.16138489544391632, 'predictions_18': 0.37865450978279114, 'predictions_19': 0.014222224242985249, 'predictions_20': 0.38761574029922485, 'predictions_21': -0.02124016545712948, 'predictions_22': 1.7526684999465942, 'predictions_23': 0.5112042427062988, 'predictions_24': 0.5034342408180237, 'predictions_25': 0.005095706321299076, 'predictions_26': 0.9831169843673706, 'predictions_27': 0.6794330477714539, 'predictions_28': 0.1802661120891571, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': -0.0415695421397686, 'predictions_1': -1.239405870437622, 'predictions_2': 0.017459018155932426, 'predictions_3': 0.04113232344388962, 'predictions_4': 0.4762759208679199, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.9339500665664673, 'predictions_8': 0.2958080470561981, 'predictions_9': 0.07594440132379532, 'predictions_10': 0.003290211781859398, 'predictions_11': 0.01872287504374981, 'predictions_12': -0.047330088913440704, 'predictions_13': 0.056555308401584625, 'predictions_14': 0.05581967905163765, 'predictions_15': 0.6933314800262451, 'predictions_16': -0.0023022573441267014, 'predictions_17': 0.13856875896453857, 'predictions_18': 0.3069765865802765, 'predictions_19': 0.06924822926521301, 'predictions_20': -0.34636712074279785, 'predictions_21': -0.8682994246482849, 'predictions_22': -0.9693347215652466, 'predictions_23': -0.4783455729484558, 'predictions_24': 0.8846019506454468, 'predictions_25': -0.053959351032972336, 'predictions_26': -0.5963033437728882, 'predictions_27': -0.5447815656661987, 'predictions_28': -0.14065201580524445, 'predictions_29': 0.1068669781088829, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': -0.024941062554717064, 'predictions_1': -1.5298322439193726, 'predictions_2': 0.01525309681892395, 'predictions_3': -0.11309991031885147, 'predictions_4': 0.5172238945960999, 'predictions_5': 0.0024520084261894226, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.5354383587837219, 'predictions_8': 0.2944106459617615, 'predictions_9': -0.0466727539896965, 'predictions_10': 0.003290211781859398, 'predictions_11': 0.0188205074518919, 'predictions_12': -0.051007892936468124, 'predictions_13': -1.3502459526062012, 'predictions_14': -0.033535201102495193, 'predictions_15': 0.10678261518478394, 'predictions_16': -0.0014769809786230326, 'predictions_17': 0.13856875896453857, 'predictions_18': 0.3855004608631134, 'predictions_19': -0.008676297031342983, 'predictions_20': -0.3423697352409363, 'predictions_21': -0.8320394158363342, 'predictions_22': -0.677459716796875, 'predictions_23': -0.5385064482688904, 'predictions_24': 0.49956056475639343, 'predictions_25': 0.005095706321299076, 'predictions_26': 1.6938838958740234, 'predictions_27': 0.842454195022583, 'predictions_28': -0.14346282184123993, 'predictions_29': 0.07541733235120773, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.009930070489645004, 'predictions_1': -0.27544116973876953, 'predictions_2': -0.002613282995298505, 'predictions_3': 0.04113232344388962, 'predictions_4': -0.055784229189157486, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.6722134947776794, 'predictions_8': 0.30412089824676514, 'predictions_9': 0.007771771401166916, 'predictions_10': 0.009325551800429821, 'predictions_11': 0.022453438490629196, 'predictions_12': 0.10843253135681152, 'predictions_13': 0.8989681005477905, 'predictions_14': -0.02233714796602726, 'predictions_15': 0.5417506694793701, 'predictions_16': -0.0010774275287985802, 'predictions_17': 0.16581103205680847, 'predictions_18': 0.406240850687027, 'predictions_19': -0.004930071532726288, 'predictions_20': 0.31123194098472595, 'predictions_21': -0.0816090777516365, 'predictions_22': 2.1133084297180176, 'predictions_23': 0.4506610333919525, 'predictions_24': -0.7193129658699036, 'predictions_25': 0.013311417773365974, 'predictions_26': 1.1290695667266846, 'predictions_27': 0.6277202367782593, 'predictions_28': -0.12229753285646439, 'predictions_29': 0.1477402150630951, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': 0.0006543132476508617, 'predictions_1': -0.8427131175994873, 'predictions_2': -0.002613282995298505, 'predictions_3': 0.04113232344388962, 'predictions_4': -0.2789610028266907, 'predictions_5': 0.004407345782965422, 'predictions_6': 0.04250117391347885, 'predictions_7': 0.7143340706825256, 'predictions_8': 0.30412089824676514, 'predictions_9': 0.0335814394056797, 'predictions_10': 0.009325551800429821, 'predictions_11': -0.11305594444274902, 'predictions_12': -0.018516669049859047, 'predictions_13': 0.10892590880393982, 'predictions_14': -0.08540848642587662, 'predictions_15': -0.09607099741697311, 'predictions_16': -0.0014769809786230326, 'predictions_17': 0.13856875896453857, 'predictions_18': 0.44763222336769104, 'predictions_19': 0.014222224242985249, 'predictions_20': 0.33993175625801086, 'predictions_21': -0.6289445757865906, 'predictions_22': 1.987050175666809, 'predictions_23': 0.5226719379425049, 'predictions_24': -0.6285008788108826, 'predictions_25': 0.003129873890429735, 'predictions_26': 1.1616733074188232, 'predictions_27': 0.8699957132339478, 'predictions_28': -0.12550924718379974, 'predictions_29': 0.1477402150630951, 'predictions_30': 0.5059375166893005}\n",
+      "{'predictions_0': -0.01911582238972187, 'predictions_1': -0.41529545187950134, 'predictions_2': -0.0034923271741718054, 'predictions_3': -0.11309991031885147, 'predictions_4': -0.30164235830307007, 'predictions_5': -0.009094981476664543, 'predictions_6': -0.08258295059204102, 'predictions_7': -0.8088644742965698, 'predictions_8': 0.2545676529407501, 'predictions_9': 0.015658268705010414, 'predictions_10': -0.08612797409296036, 'predictions_11': -0.003732672892510891, 'predictions_12': -0.24946996569633484, 'predictions_13': -0.9515364766120911, 'predictions_14': -0.030668942257761955, 'predictions_15': 0.4303477704524994, 'predictions_16': -0.007885736413300037, 'predictions_17': -0.168026864528656, 'predictions_18': 0.25735917687416077, 'predictions_19': 0.0024438181426376104, 'predictions_20': -0.5780957937240601, 'predictions_21': -0.3737794756889343, 'predictions_22': -2.412389039993286, 'predictions_23': -0.6488395929336548, 'predictions_24': -0.6861838698387146, 'predictions_25': -0.031086977571249008, 'predictions_26': -0.5648106932640076, 'predictions_27': -0.9229058623313904, 'predictions_28': -0.14026358723640442, 'predictions_29': -0.1724514663219452, 'predictions_30': 0.5059375166893005}\n"
      ]
     },
     {
@@ -477,6 +481,18 @@
      "text": [
       "\n"
      ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\u001b[2m\u001b[36m(BlockWorker pid=1494413)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494469)\u001b[0m /home/ubuntu/ray/venv/lib/python3.8/site-packages/xgboost/compat.py:31: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494469)\u001b[0m   from pandas import MultiIndex, Int64Index\n",
+      "\u001b[2m\u001b[36m(pid=1494469)\u001b[0m FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494469)\u001b[0m FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n",
+      "\u001b[2m\u001b[36m(pid=1494469)\u001b[0m FutureWarning: pandas.UInt64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n"
+     ]
     }
    ],
    "source": [
@@ -491,7 +507,7 @@
    "notebook_metadata_filter": "-all"
   },
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "Python 3.8.10 ('venv': venv)",
    "language": "python",
    "name": "python3"
   },
@@ -505,9 +521,14 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.7"
+   "version": "3.8.10"
+  },
+  "vscode": {
+   "interpreter": {
+    "hash": "3c0d54d489a08ae47a06eae2fd00ff032d6cddb527c382959b7b2575f6a8167f"
+   }
   }
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
\ No newline at end of file
+}
diff --git a/python/ray/air/examples/huggingface/huggingface_basic_language_modeling_example.py b/python/ray/air/examples/huggingface/huggingface_basic_language_modeling_example.py
index df7f1655aa00..251183bed51a 100644
--- a/python/ray/air/examples/huggingface/huggingface_basic_language_modeling_example.py
+++ b/python/ray/air/examples/huggingface/huggingface_basic_language_modeling_example.py
@@ -127,9 +127,8 @@ def train_function(train_dataset, eval_dataset=None, **config):
     )
     data = ray.data.from_pandas(pd.DataFrame(prompt, columns=["prompt"]))
     prediction = predictor.predict(data, num_gpus_per_worker=int(use_gpu))
-    prediction = prediction.to_pandas().iloc[0]["generated_text"]
 
-    print(f"Generated text for prompt '{prompt}': '{prediction}'")
+    print(f"Generated text for prompt '{prompt}': '{prediction.take(1)}'")
 
 
 if __name__ == "__main__":
diff --git a/python/ray/air/examples/tf/tensorflow_linear_dataset_example.py b/python/ray/air/examples/tf/tensorflow_linear_dataset_example.py
index 44ba34b30be9..c38afc61c92c 100644
--- a/python/ray/air/examples/tf/tensorflow_linear_dataset_example.py
+++ b/python/ray/air/examples/tf/tensorflow_linear_dataset_example.py
@@ -99,9 +99,8 @@ def predict_linear(result: Result) -> Dataset:
 
     predictions = batch_predictor.predict(prediction_dataset, dtype=tf.float32)
 
-    pandas_predictions = predictions.to_pandas(float("inf"))
-
-    print(f"PREDICTIONS\n{pandas_predictions}")
+    print("PREDICTIONS")
+    predictions.show()
 
     return predictions
 

From 2c8de938e6e8e501a1c0dbde3d0098a3ffd74405 Mon Sep 17 00:00:00 2001
From: Antoni Baum <antoni.baum@protonmail.com>
Date: Fri, 24 Jun 2022 15:34:36 +0000
Subject: [PATCH 2/2] Implement feedback from code review

---
 doc/source/ray-air/doc_code/air_key_concepts.py | 4 +---
 doc/source/ray-air/doc_code/preprocessors.py    | 4 ++--
 doc/source/ray-air/doc_code/tf_starter.py       | 2 +-
 doc/source/ray-air/doc_code/xgboost_starter.py  | 8 +++-----
 4 files changed, 7 insertions(+), 11 deletions(-)

diff --git a/doc/source/ray-air/doc_code/air_key_concepts.py b/doc/source/ray-air/doc_code/air_key_concepts.py
index 42727433751b..df71a98dea2a 100644
--- a/doc/source/ray-air/doc_code/air_key_concepts.py
+++ b/doc/source/ray-air/doc_code/air_key_concepts.py
@@ -75,9 +75,7 @@
 batch_predictor = BatchPredictor.from_checkpoint(result.checkpoint, XGBoostPredictor)
 
 # Bulk batch prediction.
-predicted_labels = batch_predictor.predict(test_dataset).map_batches(
-    lambda df: (df > 0.5).astype(int), batch_format="pandas"
-)
+predicted_probabilities = batch_predictor.predict(test_dataset)
 
 # Pipelined batch prediction: instead of processing the data in bulk, process it
 # incrementally in windows of the given size.
diff --git a/doc/source/ray-air/doc_code/preprocessors.py b/doc/source/ray-air/doc_code/preprocessors.py
index 1c19f08d2b8f..bd533f46a23c 100644
--- a/doc/source/ray-air/doc_code/preprocessors.py
+++ b/doc/source/ray-air/doc_code/preprocessors.py
@@ -88,8 +88,8 @@
 test_dataset = ray.data.from_items([{"x": x} for x in range(2, 32, 3)])
 
 batch_predictor = BatchPredictor.from_checkpoint(checkpoint, XGBoostPredictor)
-predicted_labels = batch_predictor.predict(test_dataset)
-predicted_labels.show()
+predicted_probabilities = batch_predictor.predict(test_dataset)
+predicted_probabilities.show()
 # {'predictions': 0.09843720495700836}
 # {'predictions': 5.604666709899902}
 # {'predictions': 11.405311584472656}
diff --git a/doc/source/ray-air/doc_code/tf_starter.py b/doc/source/ray-air/doc_code/tf_starter.py
index 360503294fdc..4116ff5dba58 100644
--- a/doc/source/ray-air/doc_code/tf_starter.py
+++ b/doc/source/ray-air/doc_code/tf_starter.py
@@ -105,7 +105,7 @@ def train_func(config: dict):
 
 predictions = batch_predictor.predict(prediction_dataset, dtype=tf.float32)
 
-print(f"PREDICTIONS")
+print("PREDICTIONS")
 predictions.show()
 
 # __air_tf_batchpred_end__
diff --git a/doc/source/ray-air/doc_code/xgboost_starter.py b/doc/source/ray-air/doc_code/xgboost_starter.py
index f2e7a3793d95..1d917178e691 100644
--- a/doc/source/ray-air/doc_code/xgboost_starter.py
+++ b/doc/source/ray-air/doc_code/xgboost_starter.py
@@ -59,11 +59,9 @@
 
 batch_predictor = BatchPredictor.from_checkpoint(result.checkpoint, XGBoostPredictor)
 
-predicted_labels = batch_predictor.predict(test_dataset).map_batches(
-    lambda df: (df > 0.5).astype(int), batch_format="pandas"
-)
-print("PREDICTED LABELS")
-predicted_labels.show()
+predicted_probabilities = batch_predictor.predict(test_dataset)
+print("PREDICTED PROBABILITIES")
+predicted_probabilities.show()
 
 shap_values = batch_predictor.predict(test_dataset, pred_contribs=True)
 print("SHAP VALUES")